You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@cassandra.apache.org by jb...@apache.org on 2009/04/24 04:58:25 UTC

svn commit: r768135 - /incubator/cassandra/trunk/conf/storage-conf.xml

Author: jbellis
Date: Fri Apr 24 02:58:24 2009
New Revision: 768135

URL: http://svn.apache.org/viewvc?rev=768135&view=rev
Log:
Simplify default storage-conf.xml.  patch by Sandeep Tata; reviewed by jbellis for #99

Modified:
    incubator/cassandra/trunk/conf/storage-conf.xml

Modified: incubator/cassandra/trunk/conf/storage-conf.xml
URL: http://svn.apache.org/viewvc/incubator/cassandra/trunk/conf/storage-conf.xml?rev=768135&r1=768134&r2=768135&view=diff
==============================================================================
--- incubator/cassandra/trunk/conf/storage-conf.xml (original)
+++ incubator/cassandra/trunk/conf/storage-conf.xml Fri Apr 24 02:58:24 2009
@@ -1,69 +1,111 @@
 <Storage>
-   <ClusterName>Test Cluster</ClusterName>
-   <!-- any IPartitioner may be used, including your own
-        as long as it is on the classpath.  Out of the box,
-        Cassandra provides
-        org.apache.cassandra.dht.RandomPartitioner and
-        org.apache.cassandra.dht.OrderPreservingPartitioner.
-        Range queries require using OrderPreservingPartitioner or a subclass. -->
-   <Partitioner>org.apache.cassandra.dht.RandomPartitioner</Partitioner>
-   <RackAware>false</RackAware>
-   <MulticastChannel>230.0.0.1</MulticastChannel>
-   <ReplicationFactor>1</ReplicationFactor>
-   <ZookeeperAddress>127.0.0.1</ZookeeperAddress>
-   <RpcTimeoutInMillis>5000</RpcTimeoutInMillis>
-   <JobTrackerHost>tdsearch001.sf2p.facebook.com</JobTrackerHost>
-   <JobJarFileLocation>C:\Engagements\Cassandra-Nexus</JobJarFileLocation>
-   <ListenAddress>localhost</ListenAddress>
-   <StoragePort>7000</StoragePort>
-   <ControlPort>7001</ControlPort>
-   <ThriftPort>9160</ThriftPort>
-   <ColumnIndexSizeInKB>256</ColumnIndexSizeInKB>
-   <HttpPort>7002</HttpPort>
-   <MetadataDirectory>/var/cassandra/system</MetadataDirectory>
-   <CommitLogDirectory>/var/cassandra/commitlog</CommitLogDirectory>
-   <CommitLogRotationThresholdInMB>128</CommitLogRotationThresholdInMB>
-   <!-- 
-     The maximum amount of data to store in a memtable before flushing it to
-     disk. Note: There is one memtable per column family, and this threshold
-     is based solely on the amount of data stored, not actual heap memory
-     usage (there is some overhead in indexing the columns).
-   -->
-   <MemtableSizeInMB>64</MemtableSizeInMB>
-   <!--
-     The maximum number of columns in millions. Like MemtableSizeInMB above,
-     this is used to impose a limit on how large a memtable can grow before 
-     it is flushed to disk.
-   -->
-   <MemtableObjectCountInMillions>1</MemtableObjectCountInMillions>
-   <GangliaServers>
-     <GangliaServer>127.0.0.1:12000</GangliaServer>
-   </GangliaServers>
-   <DataFileDirectories>
-     <DataFileDirectory>/var/cassandra/data</DataFileDirectory>
-   </DataFileDirectories>
-   <CalloutLocation>/var/cassandra/callouts</CalloutLocation>
-   <BootstrapFileDirectory>/var/cassandra/bootstrap</BootstrapFileDirectory>
-   <StagingFileDirectory>/var/cassandra/staging</StagingFileDirectory>
-   <CommitLogFastSync>false</CommitLogFastSync>
-   <!-- Time to wait before garbage-collection deletion markers.
-        Set this to a large enough value that you are confident
-        that the deletion marker will be propagated to all replicas
-        by the time this many seconds has elapsed, even in the
-        face of hardware failures.  The default value is ten days. -->
-   <GCGraceSeconds>864000</GCGraceSeconds>
-   <Tables>
-     <Table Name = "Table1">
-       <ColumnFamily ColumnSort="Name" Name="Standard1"/>
-       <ColumnFamily ColumnSort="Name" Name="Standard2"/>
-       <ColumnFamily ColumnSort="Time" Name="StandardByTime1"/>
-       <ColumnFamily ColumnSort="Time" Name="StandardByTime2"/>
-       <ColumnFamily ColumnType="Super" ColumnSort="Name" Name="Super1"/>
-       <ColumnFamily ColumnType="Super" ColumnSort="Name" Name="Super2"/>
-     </Table>
-   </Tables>
-   <Seeds>
-     <!-- Add names of hosts that are deemed contact points -->
-     <Seed>127.0.0.1</Seed>
-   </Seeds>
+    <!--======================================================================-->
+    <!-- Basic Configuration                                                  -->
+    <!--======================================================================-->
+    <ClusterName>Test Cluster</ClusterName>
+
+    <!-- Tables and ColumnFamilies                                            -->
+    <Tables>
+        <Table Name="Table1">
+            <ColumnFamily ColumnSort="Name" Name="Standard1"/>
+            <ColumnFamily ColumnSort="Name" Name="Standard2"/>
+            <ColumnFamily ColumnSort="Time" Name="StandardByTime1"/>
+            <ColumnFamily ColumnSort="Time" Name="StandardByTime2"/>
+            <ColumnFamily ColumnType="Super" ColumnSort="Name" Name="Super1"/>
+            <ColumnFamily ColumnType="Super" ColumnSort="Name" Name="Super2"/>
+        </Table>
+    </Tables>
+
+    <!-- Partitioner: any IPartitioner may be used, including your own
+         as long as it is on the classpath.  Out of the box,
+         Cassandra provides
+         org.apache.cassandra.dht.RandomPartitioner and
+         org.apache.cassandra.dht.OrderPreservingPartitioner.
+         Range queries require using OrderPreservingPartitioner or a subclass.
+    -->
+    <Partitioner>org.apache.cassandra.dht.RandomPartitioner</Partitioner>
+
+    <!-- RackAware: Setting this to true instructs Cassandra to try to place one replica in
+         a different rack in the same datacenter and one in a different datacenter.
+    -->
+    <RackAware>false</RackAware>
+
+    <!-- ReplicationFactor: Number of replicas of the data -->
+    <ReplicationFactor>1</ReplicationFactor>
+
+    <!-- Directories: Specify where Cassandra should store different data on disk.
+         Keep the data disks and the CommitLog disks separate for best performance.
+    -->
+    <CommitLogDirectory>/var/cassandra/commitlog</CommitLogDirectory>
+    <MetadataDirectory>/var/cassandra/system</MetadataDirectory>
+    <DataFileDirectories>
+        <DataFileDirectory>/var/cassandra/data</DataFileDirectory>
+    </DataFileDirectories>
+    <CalloutLocation>/var/cassandra/callouts</CalloutLocation>
+    <BootstrapFileDirectory>/var/cassandra/bootstrap</BootstrapFileDirectory>
+    <StagingFileDirectory>/var/cassandra/staging</StagingFileDirectory>
+
+
+    <!-- Add names of hosts that are deemed contact points. Cassandra nodes use
+         this list of hosts to find each other and learn the topology of the ring.
+    -->
+    <Seeds>
+        <Seed>127.0.0.1</Seed>
+    </Seeds>
+
+    <!-- Miscellaneous -->
+    <RpcTimeoutInMillis>5000</RpcTimeoutInMillis>
+    <CommitLogRotationThresholdInMB>128</CommitLogRotationThresholdInMB>
+    <CommitLogFastSync>false</CommitLogFastSync>
+
+    <!-- Hosts and Ports -->
+    <ListenAddress>localhost</ListenAddress>
+    <StoragePort>7000</StoragePort>
+    <ControlPort>7001</ControlPort>
+    <ThriftPort>9160</ThriftPort>
+    <HttpPort>7002</HttpPort>
+
+
+    <!--======================================================================-->
+    <!-- Memory, Disk, and Performance                                        -->
+    <!--======================================================================-->
+
+    <!-- Threshold for adding a column index in a row -->
+    <ColumnIndexSizeInKB>256</ColumnIndexSizeInKB>
+
+    <!--
+      The maximum amount of data to store in memory before flushing to
+      disk. Note: There is one memtable per column family, and this threshold
+      is based solely on the amount of data stored, not actual heap memory
+      usage (there is some overhead in indexing the columns).
+    -->
+    <MemtableSizeInMB>64</MemtableSizeInMB>
+
+    <!--
+      The maximum number of columns in millions to store in memory
+      before flushing to disk.  Use with MemtableSizeInMB to tune memory usage.
+    -->
+    <MemtableObjectCountInMillions>1</MemtableObjectCountInMillions>
+
+    <!-- Time to wait before garbage-collecting deletion markers.
+         Set this to a large enough value that you are confident
+         that the deletion marker will be propagated to all replicas
+         by the time this many seconds have elapsed, even in the
+         face of hardware failures.  The default value is ten days.
+    -->
+    <GCGraceSeconds>864000</GCGraceSeconds>
+
+
+    <!--======================================================================-->
+    <!-- OPTIONAL                                                             -->
+    <!--======================================================================-->
+    <!-- This final section contains configuration information for optional
+         and experimental features in Cassandra that are not yet fully functional.
+         Basic features in Cassandra should work fine without configuring this section.
+    -->
+    <ZookeeperAddress>127.0.0.1</ZookeeperAddress>
+    <MulticastChannel>230.0.0.1</MulticastChannel>
+    <GangliaServers>
+        <GangliaServer>127.0.0.1:12000</GangliaServer>
+    </GangliaServers>
 </Storage>