You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@spark.apache.org by ma...@apache.org on 2013/07/17 02:31:47 UTC
[50/50] [abbrv] git commit: Merge remote-tracking branch 'old/master'
Merge remote-tracking branch 'old/master'
Project: http://git-wip-us.apache.org/repos/asf/incubator-spark/repo
Commit: http://git-wip-us.apache.org/repos/asf/incubator-spark/commit/87d586e4
Tree: http://git-wip-us.apache.org/repos/asf/incubator-spark/tree/87d586e4
Diff: http://git-wip-us.apache.org/repos/asf/incubator-spark/diff/87d586e4
Branch: refs/heads/master
Commit: 87d586e4da63e6e1875d9cac194c6f11e1cdc653
Parents: d733527 4ff494d
Author: Matei Zaharia <ma...@eecs.berkeley.edu>
Authored: Tue Jul 16 17:30:15 2013 -0700
Committer: Matei Zaharia <ma...@eecs.berkeley.edu>
Committed: Tue Jul 16 17:30:15 2013 -0700
----------------------------------------------------------------------
.gitignore | 1 +
LICENSE | 229 +++-
NOTICE | 5 +
README.md | 2 +-
bagel/pom.xml | 17 +
bagel/src/main/scala/spark/bagel/Bagel.scala | 17 +
.../spark/bagel/examples/PageRankUtils.scala | 17 +
.../bagel/examples/WikipediaPageRank.scala | 17 +
.../examples/WikipediaPageRankStandalone.scala | 17 +
bagel/src/test/resources/log4j.properties | 19 +-
bagel/src/test/scala/bagel/BagelSuite.scala | 17 +
bin/compute-classpath.cmd | 71 ++
bin/compute-classpath.sh | 121 +++
bin/slaves.sh | 5 +-
bin/spark-config.sh | 19 +-
bin/spark-daemon.sh | 5 +-
bin/spark-daemons.sh | 17 +
bin/start-all.sh | 17 +
bin/start-master.sh | 17 +
bin/start-slave.sh | 20 +
bin/start-slaves.sh | 17 +
bin/stop-all.sh | 17 +
bin/stop-master.sh | 17 +
bin/stop-slaves.sh | 17 +
conf/fairscheduler.xml.template | 15 +
conf/spark-env.sh.template | 18 +-
core/pom.xml | 45 +-
.../apache/hadoop/mapred/HadoopMapRedUtil.scala | 17 +
.../hadoop/mapreduce/HadoopMapReduceUtil.scala | 17 +
.../scala/spark/deploy/SparkHadoopUtil.scala | 21 +
.../apache/hadoop/mapred/HadoopMapRedUtil.scala | 17 +
.../hadoop/mapreduce/HadoopMapReduceUtil.scala | 17 +
.../scala/spark/deploy/SparkHadoopUtil.scala | 37 +-
.../spark/deploy/yarn/ApplicationMaster.scala | 92 +-
.../yarn/ApplicationMasterArguments.scala | 17 +
.../scala/spark/deploy/yarn/Client.scala | 75 +-
.../spark/deploy/yarn/ClientArguments.scala | 25 +-
.../spark/deploy/yarn/WorkerRunnable.scala | 56 +-
.../deploy/yarn/YarnAllocationHandler.scala | 17 +
.../cluster/YarnClusterScheduler.scala | 17 +
.../apache/hadoop/mapred/HadoopMapRedUtil.scala | 17 +
.../hadoop/mapreduce/HadoopMapReduceUtil.scala | 17 +
.../scala/spark/deploy/SparkHadoopUtil.scala | 21 +
.../java/spark/network/netty/FileClient.java | 45 +-
.../netty/FileClientChannelInitializer.java | 17 +
.../spark/network/netty/FileClientHandler.java | 25 +
.../java/spark/network/netty/FileServer.java | 17 +
.../netty/FileServerChannelInitializer.java | 17 +
.../spark/network/netty/FileServerHandler.java | 17 +
.../java/spark/network/netty/PathResolver.java | 17 +
.../deploy/static/bootstrap-responsive.min.css | 9 -
.../spark/deploy/static/bootstrap.min.css | 9 -
.../resources/spark/deploy/static/sorttable.js | 495 ---------
.../spark/deploy/static/spark_logo.png | Bin 14233 -> 0 bytes
.../ui/static/bootstrap-responsive.min.css | 9 +
.../resources/spark/ui/static/bootstrap.min.css | 9 +
.../main/resources/spark/ui/static/sorttable.js | 495 +++++++++
.../spark/ui/static/spark-logo-77x50px-hd.png | Bin 0 -> 3536 bytes
.../resources/spark/ui/static/spark_logo.png | Bin 0 -> 14233 bytes
.../main/resources/spark/ui/static/webui.css | 49 +
core/src/main/scala/spark/Accumulators.scala | 17 +
core/src/main/scala/spark/Aggregator.scala | 17 +
.../scala/spark/BlockStoreShuffleFetcher.scala | 18 +
core/src/main/scala/spark/Cache.scala | 17 +
core/src/main/scala/spark/CacheManager.scala | 17 +
core/src/main/scala/spark/ClosureCleaner.scala | 17 +
core/src/main/scala/spark/Dependency.scala | 17 +
.../main/scala/spark/DoubleRDDFunctions.scala | 17 +
.../main/scala/spark/FetchFailedException.scala | 17 +
core/src/main/scala/spark/HadoopWriter.scala | 17 +
core/src/main/scala/spark/HttpFileServer.scala | 19 +-
core/src/main/scala/spark/HttpServer.scala | 17 +
core/src/main/scala/spark/JavaSerializer.scala | 17 +
core/src/main/scala/spark/KryoSerializer.scala | 21 +
core/src/main/scala/spark/Logging.scala | 17 +
.../src/main/scala/spark/MapOutputTracker.scala | 17 +
.../src/main/scala/spark/PairRDDFunctions.scala | 33 +-
core/src/main/scala/spark/Partition.scala | 17 +
core/src/main/scala/spark/Partitioner.scala | 17 +
core/src/main/scala/spark/RDD.scala | 84 +-
.../main/scala/spark/RDDCheckpointData.scala | 17 +
.../scala/spark/SequenceFileRDDFunctions.scala | 17 +
.../main/scala/spark/SerializableWritable.scala | 17 +
core/src/main/scala/spark/ShuffleFetcher.scala | 17 +
core/src/main/scala/spark/SizeEstimator.scala | 17 +
.../main/scala/spark/SoftReferenceCache.scala | 17 +
core/src/main/scala/spark/SparkContext.scala | 61 +-
core/src/main/scala/spark/SparkEnv.scala | 20 +-
core/src/main/scala/spark/SparkException.scala | 17 +
core/src/main/scala/spark/SparkFiles.java | 17 +
core/src/main/scala/spark/TaskContext.scala | 17 +
core/src/main/scala/spark/TaskEndReason.scala | 21 +-
core/src/main/scala/spark/TaskState.scala | 17 +
core/src/main/scala/spark/Utils.scala | 184 +++-
.../scala/spark/api/java/JavaDoubleRDD.scala | 17 +
.../main/scala/spark/api/java/JavaPairRDD.scala | 17 +
.../src/main/scala/spark/api/java/JavaRDD.scala | 17 +
.../main/scala/spark/api/java/JavaRDDLike.scala | 42 +
.../scala/spark/api/java/JavaSparkContext.scala | 17 +
.../java/JavaSparkContextVarargsWorkaround.java | 17 +
.../scala/spark/api/java/StorageLevels.java | 17 +
.../java/function/DoubleFlatMapFunction.java | 17 +
.../spark/api/java/function/DoubleFunction.java | 17 +
.../api/java/function/FlatMapFunction.scala | 17 +
.../api/java/function/FlatMapFunction2.scala | 17 +
.../scala/spark/api/java/function/Function.java | 17 +
.../spark/api/java/function/Function2.java | 17 +
.../api/java/function/PairFlatMapFunction.java | 17 +
.../spark/api/java/function/PairFunction.java | 17 +
.../spark/api/java/function/VoidFunction.scala | 19 +-
.../api/java/function/WrappedFunction1.scala | 17 +
.../api/java/function/WrappedFunction2.scala | 17 +
.../spark/api/python/PythonPartitioner.scala | 17 +
.../main/scala/spark/api/python/PythonRDD.scala | 54 +-
.../spark/api/python/PythonWorkerFactory.scala | 37 +-
.../spark/broadcast/BitTorrentBroadcast.scala | 17 +
.../main/scala/spark/broadcast/Broadcast.scala | 17 +
.../spark/broadcast/BroadcastFactory.scala | 17 +
.../scala/spark/broadcast/HttpBroadcast.scala | 17 +
.../scala/spark/broadcast/MultiTracker.scala | 17 +
.../main/scala/spark/broadcast/SourceInfo.scala | 17 +
.../scala/spark/broadcast/TreeBroadcast.scala | 17 +
.../spark/deploy/ApplicationDescription.scala | 17 +
core/src/main/scala/spark/deploy/Command.scala | 17 +
.../main/scala/spark/deploy/DeployMessage.scala | 17 +
.../main/scala/spark/deploy/ExecutorState.scala | 17 +
.../main/scala/spark/deploy/JsonProtocol.scala | 129 +--
.../scala/spark/deploy/LocalSparkCluster.scala | 18 +
core/src/main/scala/spark/deploy/WebUI.scala | 19 +-
.../main/scala/spark/deploy/client/Client.scala | 17 +
.../spark/deploy/client/ClientListener.scala | 17 +
.../scala/spark/deploy/client/TestClient.scala | 17 +
.../spark/deploy/client/TestExecutor.scala | 17 +
.../spark/deploy/master/ApplicationInfo.scala | 17 +
.../spark/deploy/master/ApplicationState.scala | 17 +
.../spark/deploy/master/ExecutorInfo.scala | 17 +
.../main/scala/spark/deploy/master/Master.scala | 39 +-
.../spark/deploy/master/MasterArguments.scala | 17 +
.../scala/spark/deploy/master/MasterWebUI.scala | 74 --
.../scala/spark/deploy/master/WorkerInfo.scala | 17 +
.../scala/spark/deploy/master/WorkerState.scala | 17 +
.../deploy/master/ui/ApplicationPage.scala | 117 ++
.../spark/deploy/master/ui/IndexPage.scala | 138 +++
.../spark/deploy/master/ui/MasterWebUI.scala | 76 ++
.../spark/deploy/worker/ExecutorRunner.scala | 49 +-
.../main/scala/spark/deploy/worker/Worker.scala | 36 +-
.../spark/deploy/worker/WorkerArguments.scala | 17 +
.../scala/spark/deploy/worker/WorkerWebUI.scala | 57 -
.../spark/deploy/worker/ui/IndexPage.scala | 117 ++
.../spark/deploy/worker/ui/WorkerWebUI.scala | 182 ++++
.../main/scala/spark/executor/Executor.scala | 66 +-
.../scala/spark/executor/ExecutorBackend.scala | 17 +
.../scala/spark/executor/ExecutorExitCode.scala | 17 +
.../spark/executor/ExecutorURLClassLoader.scala | 17 +
.../spark/executor/MesosExecutorBackend.scala | 17 +
.../executor/StandaloneExecutorBackend.scala | 17 +
.../main/scala/spark/executor/TaskMetrics.scala | 29 +-
.../scala/spark/network/BufferMessage.scala | 19 +-
.../main/scala/spark/network/Connection.scala | 17 +
.../scala/spark/network/ConnectionManager.scala | 17 +
.../spark/network/ConnectionManagerId.scala | 17 +
.../spark/network/ConnectionManagerTest.scala | 17 +
core/src/main/scala/spark/network/Message.scala | 17 +
.../main/scala/spark/network/MessageChunk.scala | 17 +
.../spark/network/MessageChunkHeader.scala | 17 +
.../main/scala/spark/network/ReceiverTest.scala | 17 +
.../main/scala/spark/network/SenderTest.scala | 17 +
.../scala/spark/network/netty/FileHeader.scala | 17 +
.../spark/network/netty/ShuffleCopier.scala | 82 +-
.../spark/network/netty/ShuffleSender.scala | 17 +
core/src/main/scala/spark/package.scala | 17 +
.../partial/ApproximateActionListener.scala | 17 +
.../spark/partial/ApproximateEvaluator.scala | 17 +
.../scala/spark/partial/BoundedDouble.scala | 17 +
.../scala/spark/partial/CountEvaluator.scala | 17 +
.../spark/partial/GroupedCountEvaluator.scala | 17 +
.../spark/partial/GroupedMeanEvaluator.scala | 17 +
.../spark/partial/GroupedSumEvaluator.scala | 17 +
.../scala/spark/partial/MeanEvaluator.scala | 17 +
.../scala/spark/partial/PartialResult.scala | 17 +
.../scala/spark/partial/StudentTCacher.scala | 17 +
.../main/scala/spark/partial/SumEvaluator.scala | 17 +
core/src/main/scala/spark/rdd/BlockRDD.scala | 17 +
.../src/main/scala/spark/rdd/CartesianRDD.scala | 17 +
.../main/scala/spark/rdd/CheckpointRDD.scala | 17 +
.../src/main/scala/spark/rdd/CoGroupedRDD.scala | 17 +
.../src/main/scala/spark/rdd/CoalescedRDD.scala | 17 +
core/src/main/scala/spark/rdd/EmptyRDD.scala | 17 +
core/src/main/scala/spark/rdd/FilteredRDD.scala | 17 +
.../main/scala/spark/rdd/FlatMappedRDD.scala | 17 +
core/src/main/scala/spark/rdd/GlommedRDD.scala | 17 +
core/src/main/scala/spark/rdd/HadoopRDD.scala | 19 +
core/src/main/scala/spark/rdd/JdbcRDD.scala | 17 +
.../main/scala/spark/rdd/MapPartitionsRDD.scala | 17 +
.../spark/rdd/MapPartitionsWithIndexRDD.scala | 17 +
core/src/main/scala/spark/rdd/MappedRDD.scala | 17 +
.../src/main/scala/spark/rdd/NewHadoopRDD.scala | 17 +
.../scala/spark/rdd/ParallelCollectionRDD.scala | 17 +
.../scala/spark/rdd/PartitionPruningRDD.scala | 17 +
core/src/main/scala/spark/rdd/PipedRDD.scala | 17 +
core/src/main/scala/spark/rdd/SampledRDD.scala | 17 +
core/src/main/scala/spark/rdd/ShuffledRDD.scala | 17 +
.../main/scala/spark/rdd/SubtractedRDD.scala | 17 +
core/src/main/scala/spark/rdd/UnionRDD.scala | 17 +
.../scala/spark/rdd/ZippedPartitionsRDD.scala | 17 +
core/src/main/scala/spark/rdd/ZippedRDD.scala | 17 +
.../main/scala/spark/scheduler/ActiveJob.scala | 17 +
.../scala/spark/scheduler/DAGScheduler.scala | 75 +-
.../spark/scheduler/DAGSchedulerEvent.scala | 17 +
.../scala/spark/scheduler/InputFormatInfo.scala | 21 +
.../scala/spark/scheduler/JobListener.scala | 17 +
.../main/scala/spark/scheduler/JobLogger.scala | 323 ++++++
.../main/scala/spark/scheduler/JobResult.scala | 19 +-
.../main/scala/spark/scheduler/JobWaiter.scala | 19 +-
.../main/scala/spark/scheduler/MapStatus.scala | 17 +
.../main/scala/spark/scheduler/ResultTask.scala | 17 +
.../scala/spark/scheduler/ShuffleMapTask.scala | 17 +
.../scala/spark/scheduler/SparkListener.scala | 68 +-
.../main/scala/spark/scheduler/SplitInfo.scala | 17 +
core/src/main/scala/spark/scheduler/Stage.scala | 23 +-
.../main/scala/spark/scheduler/StageInfo.scala | 19 +-
core/src/main/scala/spark/scheduler/Task.scala | 17 +
.../main/scala/spark/scheduler/TaskResult.scala | 17 +
.../scala/spark/scheduler/TaskScheduler.scala | 17 +
.../spark/scheduler/TaskSchedulerListener.scala | 17 +
.../main/scala/spark/scheduler/TaskSet.scala | 17 +
.../scheduler/cluster/ClusterScheduler.scala | 17 +
.../cluster/ClusterTaskSetManager.scala | 28 +-
.../scheduler/cluster/ExecutorLossReason.scala | 17 +
.../scala/spark/scheduler/cluster/Pool.scala | 17 +
.../spark/scheduler/cluster/Schedulable.scala | 17 +
.../scheduler/cluster/SchedulableBuilder.scala | 17 +
.../scheduler/cluster/SchedulerBackend.scala | 28 +-
.../scheduler/cluster/SchedulingAlgorithm.scala | 17 +
.../scheduler/cluster/SchedulingMode.scala | 17 +
.../cluster/SparkDeploySchedulerBackend.scala | 17 +
.../cluster/StandaloneClusterMessage.scala | 17 +
.../cluster/StandaloneSchedulerBackend.scala | 17 +
.../scheduler/cluster/TaskDescription.scala | 17 +
.../spark/scheduler/cluster/TaskInfo.scala | 17 +
.../scheduler/cluster/TaskSetManager.scala | 17 +
.../spark/scheduler/cluster/WorkerOffer.scala | 17 +
.../spark/scheduler/local/LocalScheduler.scala | 34 +-
.../scheduler/local/LocalTaskSetManager.scala | 18 +
.../mesos/CoarseMesosSchedulerBackend.scala | 17 +
.../scheduler/mesos/MesosSchedulerBackend.scala | 170 ++-
.../scala/spark/serializer/Serializer.scala | 17 +
.../spark/serializer/SerializerManager.scala | 17 +
.../scala/spark/storage/BlockException.scala | 17 +
.../scala/spark/storage/BlockFetchTracker.scala | 17 +
.../spark/storage/BlockFetcherIterator.scala | 73 +-
.../main/scala/spark/storage/BlockManager.scala | 17 +
.../scala/spark/storage/BlockManagerId.scala | 17 +
.../spark/storage/BlockManagerMaster.scala | 17 +
.../spark/storage/BlockManagerMasterActor.scala | 17 +
.../spark/storage/BlockManagerMessages.scala | 17 +
.../spark/storage/BlockManagerSlaveActor.scala | 17 +
.../scala/spark/storage/BlockManagerUI.scala | 79 --
.../spark/storage/BlockManagerWorker.scala | 17 +
.../main/scala/spark/storage/BlockMessage.scala | 17 +
.../scala/spark/storage/BlockMessageArray.scala | 17 +
.../scala/spark/storage/BlockObjectWriter.scala | 17 +
.../main/scala/spark/storage/BlockStore.scala | 17 +
.../main/scala/spark/storage/DiskStore.scala | 70 +-
.../main/scala/spark/storage/MemoryStore.scala | 17 +
.../main/scala/spark/storage/PutResult.scala | 17 +
.../spark/storage/ShuffleBlockManager.scala | 19 +-
.../main/scala/spark/storage/StorageLevel.scala | 17 +
.../main/scala/spark/storage/StorageUtils.scala | 28 +-
.../scala/spark/storage/ThreadingTest.scala | 17 +
core/src/main/scala/spark/ui/JettyUtils.scala | 132 +++
core/src/main/scala/spark/ui/Page.scala | 20 +
core/src/main/scala/spark/ui/SparkUI.scala | 79 ++
core/src/main/scala/spark/ui/UIUtils.scala | 135 +++
.../scala/spark/ui/UIWorkloadGenerator.scala | 88 ++
.../main/scala/spark/ui/env/EnvironmentUI.scala | 86 ++
.../main/scala/spark/ui/jobs/IndexPage.scala | 129 +++
.../scala/spark/ui/jobs/JobProgressUI.scala | 144 +++
.../main/scala/spark/ui/jobs/StagePage.scala | 131 +++
.../scala/spark/ui/storage/BlockManagerUI.scala | 41 +
.../main/scala/spark/ui/storage/IndexPage.scala | 81 ++
.../main/scala/spark/ui/storage/RDDPage.scala | 130 +++
core/src/main/scala/spark/util/AkkaUtils.scala | 59 +-
.../scala/spark/util/BoundedPriorityQueue.scala | 17 +
.../spark/util/ByteBufferInputStream.scala | 17 +
.../scala/spark/util/CompletionIterator.scala | 19 +-
.../main/scala/spark/util/Distribution.scala | 19 +-
.../src/main/scala/spark/util/IdGenerator.scala | 17 +
core/src/main/scala/spark/util/IntParam.scala | 17 +
.../src/main/scala/spark/util/MemoryParam.scala | 17 +
.../main/scala/spark/util/MetadataCleaner.scala | 17 +
.../main/scala/spark/util/NextIterator.scala | 19 +-
.../spark/util/RateLimitedOutputStream.scala | 17 +
.../scala/spark/util/SerializableBuffer.scala | 17 +
.../src/main/scala/spark/util/StatCounter.scala | 17 +
.../scala/spark/util/TimeStampedHashMap.scala | 17 +
.../scala/spark/util/TimeStampedHashSet.scala | 17 +
core/src/main/scala/spark/util/Vector.scala | 17 +
.../main/twirl/spark/common/layout.scala.html | 35 -
.../spark/deploy/master/app_details.scala.html | 38 -
.../spark/deploy/master/app_row.scala.html | 20 -
.../spark/deploy/master/app_table.scala.html | 21 -
.../spark/deploy/master/executor_row.scala.html | 15 -
.../deploy/master/executors_table.scala.html | 19 -
.../twirl/spark/deploy/master/index.scala.html | 53 -
.../spark/deploy/master/worker_row.scala.html | 14 -
.../spark/deploy/master/worker_table.scala.html | 18 -
.../spark/deploy/worker/executor_row.scala.html | 20 -
.../deploy/worker/executors_table.scala.html | 18 -
.../twirl/spark/deploy/worker/index.scala.html | 44 -
.../main/twirl/spark/storage/index.scala.html | 40 -
.../src/main/twirl/spark/storage/rdd.scala.html | 81 --
.../twirl/spark/storage/rdd_table.scala.html | 32 -
.../twirl/spark/storage/worker_table.scala.html | 24 -
core/src/test/resources/fairscheduler.xml | 18 +
core/src/test/resources/log4j.properties | 20 +-
.../src/test/scala/spark/AccumulatorSuite.scala | 17 +
core/src/test/scala/spark/BroadcastSuite.scala | 17 +
core/src/test/scala/spark/CheckpointSuite.scala | 27 +
.../test/scala/spark/ClosureCleanerSuite.scala | 17 +
.../src/test/scala/spark/DistributedSuite.scala | 19 +
core/src/test/scala/spark/DriverSuite.scala | 21 +
core/src/test/scala/spark/FailureSuite.scala | 17 +
core/src/test/scala/spark/FileServerSuite.scala | 32 +-
core/src/test/scala/spark/FileSuite.scala | 17 +
core/src/test/scala/spark/JavaAPISuite.java | 17 +
.../test/scala/spark/KryoSerializerSuite.scala | 17 +
.../test/scala/spark/LocalSparkContext.scala | 28 +-
.../scala/spark/MapOutputTrackerSuite.scala | 17 +
.../scala/spark/PairRDDFunctionsSuite.scala | 304 ++++++
.../test/scala/spark/PartitioningSuite.scala | 36 +-
core/src/test/scala/spark/PipedRDDSuite.scala | 35 +-
core/src/test/scala/spark/RDDSuite.scala | 163 ++-
.../test/scala/spark/SharedSparkContext.scala | 42 +
.../test/scala/spark/ShuffleNettySuite.scala | 17 +
core/src/test/scala/spark/ShuffleSuite.scala | 316 +-----
.../test/scala/spark/SizeEstimatorSuite.scala | 89 +-
core/src/test/scala/spark/SortingSuite.scala | 40 +-
core/src/test/scala/spark/ThreadingSuite.scala | 17 +
core/src/test/scala/spark/UnpersistSuite.scala | 47 +
core/src/test/scala/spark/UtilsSuite.scala | 119 ++-
.../scala/spark/ZippedPartitionsSuite.scala | 20 +-
.../src/test/scala/spark/rdd/JdbcRDDSuite.scala | 17 +
.../rdd/ParallelCollectionSplitSuite.scala | 17 +
.../spark/scheduler/ClusterSchedulerSuite.scala | 17 +
.../spark/scheduler/DAGSchedulerSuite.scala | 17 +
.../scala/spark/scheduler/JobLoggerSuite.scala | 121 +++
.../spark/scheduler/LocalSchedulerSuite.scala | 17 +
.../spark/scheduler/SparkListenerSuite.scala | 19 +-
.../spark/scheduler/TaskContextSuite.scala | 17 +
.../scala/spark/storage/BlockManagerSuite.scala | 17 +
core/src/test/scala/spark/ui/UISuite.scala | 46 +
.../scala/spark/util/DistributionSuite.scala | 17 +
.../scala/spark/util/NextIteratorSuite.scala | 17 +
.../util/RateLimitedOutputStreamSuite.scala | 17 +
docs/_plugins/copy_api_dirs.rb | 17 +
docs/configuration.md | 65 +-
docs/ec2-scripts.md | 5 +-
docs/python-programming-guide.md | 12 +-
docs/scala-programming-guide.md | 10 +-
docs/streaming-programming-guide.md | 4 +-
docs/tuning.md | 6 +-
ec2/spark-ec2 | 2 +
ec2/spark_ec2.py | 2 +
examples/pom.xml | 26 +
.../main/java/spark/examples/JavaHdfsLR.java | 17 +
.../main/java/spark/examples/JavaKMeans.java | 17 +
.../main/java/spark/examples/JavaLogQuery.java | 17 +
.../main/java/spark/examples/JavaSparkPi.java | 17 +
.../src/main/java/spark/examples/JavaTC.java | 17 +
.../main/java/spark/examples/JavaWordCount.java | 17 +
.../streaming/examples/JavaFlumeEventCount.java | 17 +
.../examples/JavaNetworkWordCount.java | 17 +
.../streaming/examples/JavaQueueStream.java | 17 +
.../scala/spark/examples/BroadcastTest.scala | 17 +
.../scala/spark/examples/CassandraTest.scala | 17 +
.../spark/examples/ExceptionHandlingTest.scala | 17 +
.../main/scala/spark/examples/GroupByTest.scala | 17 +
.../main/scala/spark/examples/HBaseTest.scala | 19 +-
.../main/scala/spark/examples/HdfsTest.scala | 17 +
.../main/scala/spark/examples/LocalALS.scala | 17 +
.../main/scala/spark/examples/LocalFileLR.scala | 17 +
.../main/scala/spark/examples/LocalKMeans.scala | 17 +
.../src/main/scala/spark/examples/LocalLR.scala | 17 +
.../src/main/scala/spark/examples/LocalPi.scala | 17 +
.../main/scala/spark/examples/LogQuery.scala | 17 +
.../spark/examples/MultiBroadcastTest.scala | 17 +
.../examples/SimpleSkewedGroupByTest.scala | 17 +
.../spark/examples/SkewedGroupByTest.scala | 17 +
.../main/scala/spark/examples/SparkALS.scala | 17 +
.../main/scala/spark/examples/SparkHdfsLR.scala | 17 +
.../main/scala/spark/examples/SparkKMeans.scala | 17 +
.../src/main/scala/spark/examples/SparkLR.scala | 17 +
.../src/main/scala/spark/examples/SparkPi.scala | 17 +
.../src/main/scala/spark/examples/SparkTC.scala | 17 +
.../streaming/examples/ActorWordCount.scala | 17 +
.../streaming/examples/FlumeEventCount.scala | 17 +
.../streaming/examples/HdfsWordCount.scala | 17 +
.../streaming/examples/KafkaWordCount.scala | 19 +-
.../streaming/examples/NetworkWordCount.scala | 17 +
.../spark/streaming/examples/QueueStream.scala | 17 +
.../streaming/examples/RawNetworkGrep.scala | 17 +
.../examples/StatefulNetworkWordCount.scala | 67 ++
.../streaming/examples/TwitterAlgebirdCMS.scala | 26 +-
.../streaming/examples/TwitterAlgebirdHLL.scala | 26 +-
.../streaming/examples/TwitterPopularTags.scala | 26 +-
.../streaming/examples/ZeroMQWordCount.scala | 17 +
.../clickstream/PageViewGenerator.scala | 17 +
.../examples/clickstream/PageViewStream.scala | 17 +
make-distribution.sh | 58 +
mllib/data/als/test.data | 16 +
mllib/data/lr-data/random.data | 1000 ++++++++++++++++++
mllib/data/ridge-data/lpsa.data | 67 ++
.../scala/spark/mllib/clustering/KMeans.scala | 334 ++++++
.../spark/mllib/clustering/KMeansModel.scala | 44 +
.../spark/mllib/clustering/LocalKMeans.scala | 105 ++
.../spark/mllib/optimization/Gradient.scala | 50 +
.../mllib/optimization/GradientDescent.scala | 79 ++
.../spark/mllib/optimization/Updater.scala | 44 +
.../scala/spark/mllib/recommendation/ALS.scala | 436 ++++++++
.../MatrixFactorizationModel.scala | 40 +
.../mllib/regression/LogisticRegression.scala | 175 +++
.../LogisticRegressionGenerator.scala | 58 +
.../spark/mllib/regression/Regression.scala | 38 +
.../mllib/regression/RidgeRegression.scala | 211 ++++
.../regression/RidgeRegressionGenerator.scala | 72 ++
.../main/scala/spark/mllib/util/MLUtils.scala | 112 ++
mllib/src/test/resources/log4j.properties | 28 +
.../spark/mllib/clustering/KMeansSuite.scala | 170 +++
.../spark/mllib/recommendation/ALSSuite.scala | 97 ++
.../regression/LogisticRegressionSuite.scala | 74 ++
.../mllib/regression/RidgeRegressionSuite.scala | 64 ++
pom.xml | 103 +-
project/SparkBuild.scala | 47 +-
project/build.properties | 17 +
project/plugins.sbt | 2 -
pyspark | 17 +
python/epydoc.conf | 17 +
python/examples/als.py | 17 +
python/examples/kmeans.py | 17 +
python/examples/logistic_regression.py | 17 +
python/examples/pi.py | 17 +
python/examples/transitive_closure.py | 17 +
python/examples/wordcount.py | 17 +
python/pyspark/accumulators.py | 17 +
python/pyspark/broadcast.py | 17 +
python/pyspark/context.py | 17 +
python/pyspark/daemon.py | 59 +-
python/pyspark/files.py | 17 +
python/pyspark/java_gateway.py | 17 +
python/pyspark/rdd.py | 17 +
python/pyspark/serializers.py | 17 +
python/pyspark/shell.py | 17 +
python/pyspark/tests.py | 17 +
python/pyspark/worker.py | 17 +
python/run-tests | 20 +-
repl-bin/pom.xml | 17 +
repl-bin/src/deb/bin/run | 19 +-
repl-bin/src/deb/bin/spark-executor | 17 +
repl-bin/src/deb/bin/spark-shell | 17 +
repl/pom.xml | 17 +
.../scala/spark/repl/ExecutorClassLoader.scala | 17 +
repl/src/main/scala/spark/repl/Main.scala | 17 +
repl/src/main/scala/spark/repl/SparkILoop.scala | 11 +-
repl/src/test/resources/log4j.properties | 19 +-
repl/src/test/scala/spark/repl/ReplSuite.scala | 55 +-
run | 151 ++-
run.cmd | 18 +
run2.cmd | 63 +-
sbt/sbt | 22 +-
sbt/sbt.cmd | 20 +
spark-executor | 18 +
spark-shell | 86 +-
spark-shell.cmd | 18 +
streaming/pom.xml | 21 +
.../main/scala/spark/streaming/Checkpoint.scala | 26 +-
.../main/scala/spark/streaming/DStream.scala | 26 +-
.../spark/streaming/DStreamCheckpointData.scala | 17 +
.../scala/spark/streaming/DStreamGraph.scala | 17 +
.../main/scala/spark/streaming/Duration.scala | 23 +-
.../main/scala/spark/streaming/Interval.scala | 17 +
.../src/main/scala/spark/streaming/Job.scala | 17 +
.../main/scala/spark/streaming/JobManager.scala | 17 +
.../spark/streaming/NetworkInputTracker.scala | 17 +
.../spark/streaming/PairDStreamFunctions.scala | 20 +-
.../main/scala/spark/streaming/Scheduler.scala | 17 +
.../spark/streaming/StreamingContext.scala | 77 +-
.../src/main/scala/spark/streaming/Time.scala | 19 +-
.../spark/streaming/api/java/JavaDStream.scala | 19 +-
.../streaming/api/java/JavaDStreamLike.scala | 19 +-
.../streaming/api/java/JavaPairDStream.scala | 17 +
.../api/java/JavaStreamingContext.scala | 140 ++-
.../streaming/dstream/CoGroupedDStream.scala | 17 +
.../dstream/ConstantInputDStream.scala | 19 +-
.../streaming/dstream/FileInputDStream.scala | 17 +
.../streaming/dstream/FilteredDStream.scala | 17 +
.../dstream/FlatMapValuedDStream.scala | 17 +
.../streaming/dstream/FlatMappedDStream.scala | 17 +
.../streaming/dstream/FlumeInputDStream.scala | 17 +
.../streaming/dstream/ForEachDStream.scala | 17 +
.../streaming/dstream/GlommedDStream.scala | 17 +
.../spark/streaming/dstream/InputDStream.scala | 17 +
.../streaming/dstream/KafkaInputDStream.scala | 111 +-
.../dstream/MapPartitionedDStream.scala | 17 +
.../streaming/dstream/MapValuedDStream.scala | 17 +
.../spark/streaming/dstream/MappedDStream.scala | 17 +
.../streaming/dstream/NetworkInputDStream.scala | 37 +-
.../dstream/PluggableInputDStream.scala | 17 +
.../streaming/dstream/QueueInputDStream.scala | 17 +
.../streaming/dstream/RawInputDStream.scala | 17 +
.../dstream/ReducedWindowedDStream.scala | 17 +
.../streaming/dstream/ShuffledDStream.scala | 17 +
.../streaming/dstream/SocketInputDStream.scala | 17 +
.../spark/streaming/dstream/StateDStream.scala | 17 +
.../streaming/dstream/TransformedDStream.scala | 17 +
.../streaming/dstream/TwitterInputDStream.scala | 47 +-
.../spark/streaming/dstream/UnionDStream.scala | 17 +
.../streaming/dstream/WindowedDStream.scala | 17 +
.../streaming/receivers/ActorReceiver.scala | 24 +-
.../streaming/receivers/ZeroMQReceiver.scala | 17 +
.../main/scala/spark/streaming/util/Clock.scala | 17 +
.../streaming/util/MasterFailureTest.scala | 17 +
.../spark/streaming/util/RawTextHelper.scala | 17 +
.../spark/streaming/util/RawTextSender.scala | 17 +
.../spark/streaming/util/RecurringTimer.scala | 17 +
.../test/java/spark/streaming/JavaAPISuite.java | 31 +-
.../java/spark/streaming/JavaTestUtils.scala | 19 +-
streaming/src/test/resources/log4j.properties | 19 +-
.../spark/streaming/BasicOperationsSuite.scala | 21 +-
.../scala/spark/streaming/CheckpointSuite.scala | 17 +
.../scala/spark/streaming/FailureSuite.scala | 17 +
.../spark/streaming/InputStreamsSuite.scala | 28 +
.../scala/spark/streaming/TestSuiteBase.scala | 17 +
.../spark/streaming/WindowOperationsSuite.scala | 17 +
534 files changed, 16388 insertions(+), 2690 deletions(-)
----------------------------------------------------------------------
http://git-wip-us.apache.org/repos/asf/incubator-spark/blob/87d586e4/README.md
----------------------------------------------------------------------