|
|
@@ -1,664 +0,0 @@
|
|
|
-# Cassandra storage config YAML
|
|
|
-
|
|
|
-# NOTE:
|
|
|
-# See http://wiki.apache.org/cassandra/StorageConfiguration for
|
|
|
-# full explanations of configuration directives
|
|
|
-# /NOTE
|
|
|
-
|
|
|
-# The name of the cluster. This is mainly used to prevent machines in
|
|
|
-# one logical cluster from joining another.
|
|
|
-cluster_name: 'Test Cluster'
|
|
|
-
|
|
|
-# This defines the number of tokens randomly assigned to this node on the ring
|
|
|
-# The more tokens, relative to other nodes, the larger the proportion of data
|
|
|
-# that this node will store. You probably want all nodes to have the same number
|
|
|
-# of tokens assuming they have equal hardware capability.
|
|
|
-#
|
|
|
-# If you leave this unspecified, Cassandra will use the default of 1 token for legacy compatibility,
|
|
|
-# and will use the initial_token as described below.
|
|
|
-#
|
|
|
-# Specifying initial_token will override this setting.
|
|
|
-#
|
|
|
-# If you already have a cluster with 1 token per node, and wish to migrate to
|
|
|
-# multiple tokens per node, see http://wiki.apache.org/cassandra/Operations
|
|
|
-# num_tokens: 256
|
|
|
-
|
|
|
-# If you haven't specified num_tokens, or have set it to the default of 1 then
|
|
|
-# you should always specify InitialToken when setting up a production
|
|
|
-# cluster for the first time, and often when adding capacity later.
|
|
|
-# The principle is that each node should be given an equal slice of
|
|
|
-# the token ring; see http://wiki.apache.org/cassandra/Operations
|
|
|
-# for more details.
|
|
|
-#
|
|
|
-# If blank, Cassandra will request a token bisecting the range of
|
|
|
-# the heaviest-loaded existing node. If there is no load information
|
|
|
-# available, such as is the case with a new cluster, it will pick
|
|
|
-# a random token, which will lead to hot spots.
|
|
|
-initial_token:
|
|
|
-
|
|
|
-# See http://wiki.apache.org/cassandra/HintedHandoff
|
|
|
-hinted_handoff_enabled: true
|
|
|
-# this defines the maximum amount of time a dead host will have hints
|
|
|
-# generated. After it has been dead this long, new hints for it will not be
|
|
|
-# created until it has been seen alive and gone down again.
|
|
|
-max_hint_window_in_ms: 10800000 # 3 hours
|
|
|
-# Maximum throttle in KBs per second, per delivery thread. This will be
|
|
|
-# reduced proportionally to the number of nodes in the cluster. (If there
|
|
|
-# are two nodes in the cluster, each delivery thread will use the maximum
|
|
|
-# rate; if there are three, each will throttle to half of the maximum,
|
|
|
-# since we expect two nodes to be delivering hints simultaneously.)
|
|
|
-hinted_handoff_throttle_in_kb: 1024
|
|
|
-# Number of threads with which to deliver hints;
|
|
|
-# Consider increasing this number when you have multi-dc deployments, since
|
|
|
-# cross-dc handoff tends to be slower
|
|
|
-max_hints_delivery_threads: 2
|
|
|
-
|
|
|
-# Maximum throttle in KBs per second, total. This will be
|
|
|
-# reduced proportionally to the number of nodes in the cluster.
|
|
|
-batchlog_replay_throttle_in_kb: 1024
|
|
|
-
|
|
|
-# Authentication backend, implementing IAuthenticator; used to identify users
|
|
|
-# Out of the box, Cassandra provides org.apache.cassandra.auth.{AllowAllAuthenticator,
|
|
|
-# PasswordAuthenticator}.
|
|
|
-#
|
|
|
-# - AllowAllAuthenticator performs no checks - set it to disable authentication.
|
|
|
-# - PasswordAuthenticator relies on username/password pairs to authenticate
|
|
|
-# users. It keeps usernames and hashed passwords in system_auth.credentials table.
|
|
|
-# Please increase system_auth keyspace replication factor if you use this authenticator.
|
|
|
-authenticator: AllowAllAuthenticator
|
|
|
-
|
|
|
-# Authorization backend, implementing IAuthorizer; used to limit access/provide permissions
|
|
|
-# Out of the box, Cassandra provides org.apache.cassandra.auth.{AllowAllAuthorizer,
|
|
|
-# CassandraAuthorizer}.
|
|
|
-#
|
|
|
-# - AllowAllAuthorizer allows any action to any user - set it to disable authorization.
|
|
|
-# - CassandraAuthorizer stores permissions in system_auth.permissions table. Please
|
|
|
-# increase system_auth keyspace replication factor if you use this authorizer.
|
|
|
-authorizer: AllowAllAuthorizer
|
|
|
-
|
|
|
-# Validity period for permissions cache (fetching permissions can be an
|
|
|
-# expensive operation depending on the authorizer, CassandraAuthorizer is
|
|
|
-# one example). Defaults to 2000, set to 0 to disable.
|
|
|
-# Will be disabled automatically for AllowAllAuthorizer.
|
|
|
-permissions_validity_in_ms: 2000
|
|
|
-
|
|
|
-# The partitioner is responsible for distributing rows (by key) across
|
|
|
-# nodes in the cluster. Any IPartitioner may be used, including your
|
|
|
-# own as long as it is on the classpath. Out of the box, Cassandra
|
|
|
-# provides org.apache.cassandra.dht.{Murmur3Partitioner, RandomPartitioner
|
|
|
-# ByteOrderedPartitioner, OrderPreservingPartitioner (deprecated)}.
|
|
|
-#
|
|
|
-# - RandomPartitioner distributes rows across the cluster evenly by md5.
|
|
|
-# This is the default prior to 1.2 and is retained for compatibility.
|
|
|
-# - Murmur3Partitioner is similar to RandomPartioner but uses Murmur3_128
|
|
|
-# Hash Function instead of md5. When in doubt, this is the best option.
|
|
|
-# - ByteOrderedPartitioner orders rows lexically by key bytes. BOP allows
|
|
|
-# scanning rows in key order, but the ordering can generate hot spots
|
|
|
-# for sequential insertion workloads.
|
|
|
-# - OrderPreservingPartitioner is an obsolete form of BOP, that stores
|
|
|
-# - keys in a less-efficient format and only works with keys that are
|
|
|
-# UTF8-encoded Strings.
|
|
|
-# - CollatingOPP collates according to EN,US rules rather than lexical byte
|
|
|
-# ordering. Use this as an example if you need custom collation.
|
|
|
-#
|
|
|
-# See http://wiki.apache.org/cassandra/Operations for more on
|
|
|
-# partitioners and token selection.
|
|
|
-partitioner: org.apache.cassandra.dht.Murmur3Partitioner
|
|
|
-
|
|
|
-# Directories where Cassandra should store data on disk. Cassandra
|
|
|
-# will spread data evenly across them, subject to the granularity of
|
|
|
-# the configured compaction strategy.
|
|
|
-data_file_directories:
|
|
|
- - /var/lib/cassandra/data
|
|
|
-
|
|
|
-# commit log
|
|
|
-commitlog_directory: /var/lib/cassandra/commitlog
|
|
|
-
|
|
|
-# policy for data disk failures:
|
|
|
-# stop: shut down gossip and Thrift, leaving the node effectively dead, but
|
|
|
-# can still be inspected via JMX.
|
|
|
-# best_effort: stop using the failed disk and respond to requests based on
|
|
|
-# remaining available sstables. This means you WILL see obsolete
|
|
|
-# data at CL.ONE!
|
|
|
-# ignore: ignore fatal errors and let requests fail, as in pre-1.2 Cassandra
|
|
|
-disk_failure_policy: stop
|
|
|
-
|
|
|
-# Maximum size of the key cache in memory.
|
|
|
-#
|
|
|
-# Each key cache hit saves 1 seek and each row cache hit saves 2 seeks at the
|
|
|
-# minimum, sometimes more. The key cache is fairly tiny for the amount of
|
|
|
-# time it saves, so it's worthwhile to use it at large numbers.
|
|
|
-# The row cache saves even more time, but must contain the entire row,
|
|
|
-# so it is extremely space-intensive. It's best to only use the
|
|
|
-# row cache if you have hot rows or static rows.
|
|
|
-#
|
|
|
-# NOTE: if you reduce the size, you may not get you hottest keys loaded on startup.
|
|
|
-#
|
|
|
-# Default value is empty to make it "auto" (min(5% of Heap (in MB), 100MB)). Set to 0 to disable key cache.
|
|
|
-key_cache_size_in_mb:
|
|
|
-
|
|
|
-# Duration in seconds after which Cassandra should
|
|
|
-# save the key cache. Caches are saved to saved_caches_directory as
|
|
|
-# specified in this configuration file.
|
|
|
-#
|
|
|
-# Saved caches greatly improve cold-start speeds, and is relatively cheap in
|
|
|
-# terms of I/O for the key cache. Row cache saving is much more expensive and
|
|
|
-# has limited use.
|
|
|
-#
|
|
|
-# Default is 14400 or 4 hours.
|
|
|
-key_cache_save_period: 14400
|
|
|
-
|
|
|
-# Number of keys from the key cache to save
|
|
|
-# Disabled by default, meaning all keys are going to be saved
|
|
|
-# key_cache_keys_to_save: 100
|
|
|
-
|
|
|
-# Maximum size of the row cache in memory.
|
|
|
-# NOTE: if you reduce the size, you may not get you hottest keys loaded on startup.
|
|
|
-#
|
|
|
-# Default value is 0, to disable row caching.
|
|
|
-row_cache_size_in_mb: 0
|
|
|
-
|
|
|
-# Duration in seconds after which Cassandra should
|
|
|
-# safe the row cache. Caches are saved to saved_caches_directory as specified
|
|
|
-# in this configuration file.
|
|
|
-#
|
|
|
-# Saved caches greatly improve cold-start speeds, and is relatively cheap in
|
|
|
-# terms of I/O for the key cache. Row cache saving is much more expensive and
|
|
|
-# has limited use.
|
|
|
-#
|
|
|
-# Default is 0 to disable saving the row cache.
|
|
|
-row_cache_save_period: 0
|
|
|
-
|
|
|
-# Number of keys from the row cache to save
|
|
|
-# Disabled by default, meaning all keys are going to be saved
|
|
|
-# row_cache_keys_to_save: 100
|
|
|
-
|
|
|
-
|
|
|
-# saved caches
|
|
|
-saved_caches_directory: /var/lib/cassandra/saved_caches
|
|
|
-
|
|
|
-# commitlog_sync may be either "periodic" or "batch."
|
|
|
-# When in batch mode, Cassandra won't ack writes until the commit log
|
|
|
-# has been fsynced to disk. It will wait up to
|
|
|
-# commitlog_sync_batch_window_in_ms milliseconds for other writes, before
|
|
|
-# performing the sync.
|
|
|
-#
|
|
|
-# commitlog_sync: batch
|
|
|
-# commitlog_sync_batch_window_in_ms: 50
|
|
|
-#
|
|
|
-# the other option is "periodic" where writes may be acked immediately
|
|
|
-# and the CommitLog is simply synced every commitlog_sync_period_in_ms
|
|
|
-# milliseconds. By default this allows 1024*(CPU cores) pending
|
|
|
-# entries on the commitlog queue. If you are writing very large blobs,
|
|
|
-# you should reduce that; 16*cores works reasonably well for 1MB blobs.
|
|
|
-# It should be at least as large as the concurrent_writes setting.
|
|
|
-commitlog_sync: periodic
|
|
|
-commitlog_sync_period_in_ms: 10000
|
|
|
-# commitlog_periodic_queue_size:
|
|
|
-
|
|
|
-# The size of the individual commitlog file segments. A commitlog
|
|
|
-# segment may be archived, deleted, or recycled once all the data
|
|
|
-# in it (potentially from each columnfamily in the system) has been
|
|
|
-# flushed to sstables.
|
|
|
-#
|
|
|
-# The default size is 32, which is almost always fine, but if you are
|
|
|
-# archiving commitlog segments (see commitlog_archiving.properties),
|
|
|
-# then you probably want a finer granularity of archiving; 8 or 16 MB
|
|
|
-# is reasonable.
|
|
|
-commitlog_segment_size_in_mb: 32
|
|
|
-
|
|
|
-# any class that implements the SeedProvider interface and has a
|
|
|
-# constructor that takes a Map<String, String> of parameters will do.
|
|
|
-seed_provider:
|
|
|
- # Addresses of hosts that are deemed contact points.
|
|
|
- # Cassandra nodes use this list of hosts to find each other and learn
|
|
|
- # the topology of the ring. You must change this if you are running
|
|
|
- # multiple nodes!
|
|
|
- - class_name: org.apache.cassandra.locator.SimpleSeedProvider
|
|
|
- parameters:
|
|
|
- # seeds is actually a comma-delimited list of addresses.
|
|
|
- # Ex: "<ip1>,<ip2>,<ip3>"
|
|
|
- - seeds: "127.0.0.1"
|
|
|
-
|
|
|
-# emergency pressure valve #2: the first time heap usage after a full
|
|
|
-# (CMS) garbage collection is above this fraction of the max,
|
|
|
-# Cassandra will reduce cache maximum _capacity_ to the given fraction
|
|
|
-# of the current _size_. Should usually be set substantially above
|
|
|
-# flush_largest_memtables_at, since that will have less long-term
|
|
|
-# impact on the system.
|
|
|
-#
|
|
|
-
|
|
|
-# For workloads with more data than can fit in memory, Cassandra's
|
|
|
-# bottleneck will be reads that need to fetch data from
|
|
|
-# disk. "concurrent_reads" should be set to (16 * number_of_drives) in
|
|
|
-# order to allow the operations to enqueue low enough in the stack
|
|
|
-# that the OS and drives can reorder them.
|
|
|
-#
|
|
|
-# On the other hand, since writes are almost never IO bound, the ideal
|
|
|
-# number of "concurrent_writes" is dependent on the number of cores in
|
|
|
-# your system; (8 * number_of_cores) is a good rule of thumb.
|
|
|
-concurrent_reads: 32
|
|
|
-concurrent_writes: 32
|
|
|
-
|
|
|
-# Total memory to use for memtables. Cassandra will flush the largest
|
|
|
-# memtable when this much memory is used.
|
|
|
-# If omitted, Cassandra will set it to 1/3 of the heap.
|
|
|
-# memtable_total_space_in_mb: 2048
|
|
|
-
|
|
|
-# Total space to use for commitlogs. Since commitlog segments are
|
|
|
-# mmapped, and hence use up address space, the default size is 32
|
|
|
-# on 32-bit JVMs, and 1024 on 64-bit JVMs.
|
|
|
-#
|
|
|
-# If space gets above this value (it will round up to the next nearest
|
|
|
-# segment multiple), Cassandra will flush every dirty CF in the oldest
|
|
|
-# segment and remove it. So a small total commitlog space will tend
|
|
|
-# to cause more flush activity on less-active columnfamilies.
|
|
|
-# commitlog_total_space_in_mb: 4096
|
|
|
-
|
|
|
-# This sets the amount of memtable flush writer threads. These will
|
|
|
-# be blocked by disk io, and each one will hold a memtable in memory
|
|
|
-# while blocked. If you have a large heap and many data directories,
|
|
|
-# you can increase this value for better flush performance.
|
|
|
-# By default this will be set to the amount of data directories defined.
|
|
|
-#memtable_flush_writers: 1
|
|
|
-
|
|
|
-# the number of full memtables to allow pending flush, that is,
|
|
|
-# waiting for a writer thread. At a minimum, this should be set to
|
|
|
-# the maximum number of secondary indexes created on a single CF.
|
|
|
-memtable_flush_queue_size: 4
|
|
|
-
|
|
|
-# Whether to, when doing sequential writing, fsync() at intervals in
|
|
|
-# order to force the operating system to flush the dirty
|
|
|
-# buffers. Enable this to avoid sudden dirty buffer flushing from
|
|
|
-# impacting read latencies. Almost always a good idea on SSDs; not
|
|
|
-# necessarily on platters.
|
|
|
-trickle_fsync: false
|
|
|
-trickle_fsync_interval_in_kb: 10240
|
|
|
-
|
|
|
-# TCP port, for commands and data
|
|
|
-storage_port: 7000
|
|
|
-
|
|
|
-# SSL port, for encrypted communication. Unused unless enabled in
|
|
|
-# encryption_options
|
|
|
-ssl_storage_port: 7001
|
|
|
-
|
|
|
-# Address to bind to and tell other Cassandra nodes to connect to. You
|
|
|
-# _must_ change this if you want multiple nodes to be able to
|
|
|
-# communicate!
|
|
|
-#
|
|
|
-# Leaving it blank leaves it up to InetAddress.getLocalHost(). This
|
|
|
-# will always do the Right Thing _if_ the node is properly configured
|
|
|
-# (hostname, name resolution, etc), and the Right Thing is to use the
|
|
|
-# address associated with the hostname (it might not be).
|
|
|
-#
|
|
|
-# Setting this to 0.0.0.0 is always wrong.
|
|
|
-listen_address: localhost
|
|
|
-
|
|
|
-# Address to broadcast to other Cassandra nodes
|
|
|
-# Leaving this blank will set it to the same value as listen_address
|
|
|
-# broadcast_address: 1.2.3.4
|
|
|
-
|
|
|
-# Internode authentication backend, implementing IInternodeAuthenticator;
|
|
|
-# used to allow/disallow connections from peer nodes.
|
|
|
-# internode_authenticator: org.apache.cassandra.auth.AllowAllInternodeAuthenticator
|
|
|
-
|
|
|
-# Whether to start the native transport server.
|
|
|
-# Please note that the address on which the native transport is bound is the
|
|
|
-# same as the rpc_address. The port however is different and specified below.
|
|
|
-start_native_transport: true
|
|
|
-# port for the CQL native transport to listen for clients on
|
|
|
-native_transport_port: 9042
|
|
|
-# The minimum and maximum threads for handling requests when the native
|
|
|
-# transport is used. They are similar to rpc_min_threads and rpc_max_threads,
|
|
|
-# though the defaults differ slightly.
|
|
|
-# NOTE: native_transport_min_threads is now deprecated and ignored (but kept
|
|
|
-# in the 1.2.x series for compatibility sake).
|
|
|
-# native_transport_min_threads: 16
|
|
|
-# native_transport_max_threads: 128
|
|
|
-
|
|
|
-# Whether to start the thrift rpc server.
|
|
|
-start_rpc: true
|
|
|
-
|
|
|
-# The address to bind the Thrift RPC service and native transport
|
|
|
-# server -- clients connect here.
|
|
|
-#
|
|
|
-# Leaving this blank has the same effect it does for ListenAddress,
|
|
|
-# (i.e. it will be based on the configured hostname of the node).
|
|
|
-#
|
|
|
-# Note that unlike ListenAddress above, it is allowed to specify 0.0.0.0
|
|
|
-# here if you want to listen on all interfaces, but that will break clients
|
|
|
-# that rely on node auto-discovery.
|
|
|
-rpc_address: localhost
|
|
|
-# port for Thrift to listen for clients on
|
|
|
-rpc_port: 9160
|
|
|
-
|
|
|
-# enable or disable keepalive on rpc/native connections
|
|
|
-rpc_keepalive: true
|
|
|
-
|
|
|
-# Cassandra provides three out-of-the-box options for the RPC Server:
|
|
|
-#
|
|
|
-# sync -> One thread per thrift connection. For a very large number of clients, memory
|
|
|
-# will be your limiting factor. On a 64 bit JVM, 180KB is the minimum stack size
|
|
|
-# per thread, and that will correspond to your use of virtual memory (but physical memory
|
|
|
-# may be limited depending on use of stack space).
|
|
|
-#
|
|
|
-# hsha -> Stands for "half synchronous, half asynchronous." All thrift clients are handled
|
|
|
-# asynchronously using a small number of threads that does not vary with the amount
|
|
|
-# of thrift clients (and thus scales well to many clients). The rpc requests are still
|
|
|
-# synchronous (one thread per active request).
|
|
|
-#
|
|
|
-# The default is sync because on Windows hsha is about 30% slower. On Linux,
|
|
|
-# sync/hsha performance is about the same, with hsha of course using less memory.
|
|
|
-#
|
|
|
-# Alternatively, can provide your own RPC server by providing the fully-qualified class name
|
|
|
-# of an o.a.c.t.TServerFactory that can create an instance of it.
|
|
|
-rpc_server_type: sync
|
|
|
-
|
|
|
-# Uncomment rpc_min|max_thread to set request pool size limits.
|
|
|
-#
|
|
|
-# Regardless of your choice of RPC server (see above), the number of maximum requests in the
|
|
|
-# RPC thread pool dictates how many concurrent requests are possible (but if you are using the sync
|
|
|
-# RPC server, it also dictates the number of clients that can be connected at all).
|
|
|
-#
|
|
|
-# The default is unlimited and thus provides no protection against clients overwhelming the server. You are
|
|
|
-# encouraged to set a maximum that makes sense for you in production, but do keep in mind that
|
|
|
-# rpc_max_threads represents the maximum number of client requests this server may execute concurrently.
|
|
|
-#
|
|
|
-# rpc_min_threads: 16
|
|
|
-# rpc_max_threads: 2048
|
|
|
-
|
|
|
-# uncomment to set socket buffer sizes on rpc connections
|
|
|
-# rpc_send_buff_size_in_bytes:
|
|
|
-# rpc_recv_buff_size_in_bytes:
|
|
|
-
|
|
|
-# Uncomment to set socket buffer size for internode communication
|
|
|
-# Note that when setting this, the buffer size is limited by net.core.wmem_max
|
|
|
-# and when not setting it it is defined by net.ipv4.tcp_wmem
|
|
|
-# See:
|
|
|
-# /proc/sys/net/core/wmem_max
|
|
|
-# /proc/sys/net/core/rmem_max
|
|
|
-# /proc/sys/net/ipv4/tcp_wmem
|
|
|
-# /proc/sys/net/ipv4/tcp_wmem
|
|
|
-# and: man tcp
|
|
|
-# internode_send_buff_size_in_bytes:
|
|
|
-# internode_recv_buff_size_in_bytes:
|
|
|
-
|
|
|
-# Frame size for thrift (maximum message length).
|
|
|
-thrift_framed_transport_size_in_mb: 15
|
|
|
-
|
|
|
-# Set to true to have Cassandra create a hard link to each sstable
|
|
|
-# flushed or streamed locally in a backups/ subdirectory of the
|
|
|
-# keyspace data. Removing these links is the operator's
|
|
|
-# responsibility.
|
|
|
-incremental_backups: false
|
|
|
-
|
|
|
-# Whether or not to take a snapshot before each compaction. Be
|
|
|
-# careful using this option, since Cassandra won't clean up the
|
|
|
-# snapshots for you. Mostly useful if you're paranoid when there
|
|
|
-# is a data format change.
|
|
|
-snapshot_before_compaction: false
|
|
|
-
|
|
|
-# Whether or not a snapshot is taken of the data before keyspace truncation
|
|
|
-# or dropping of column families. The STRONGLY advised default of true
|
|
|
-# should be used to provide data safety. If you set this flag to false, you will
|
|
|
-# lose data on truncation or drop.
|
|
|
-auto_snapshot: true
|
|
|
-
|
|
|
-# Add column indexes to a row after its contents reach this size.
|
|
|
-# Increase if your column values are large, or if you have a very large
|
|
|
-# number of columns. The competing causes are, Cassandra has to
|
|
|
-# deserialize this much of the row to read a single column, so you want
|
|
|
-# it to be small - at least if you do many partial-row reads - but all
|
|
|
-# the index data is read for each access, so you don't want to generate
|
|
|
-# that wastefully either.
|
|
|
-column_index_size_in_kb: 64
|
|
|
-
|
|
|
-# Size limit for rows being compacted in memory. Larger rows will spill
|
|
|
-# over to disk and use a slower two-pass compaction process. A message
|
|
|
-# will be logged specifying the row key.
|
|
|
-in_memory_compaction_limit_in_mb: 64
|
|
|
-
|
|
|
-# Number of simultaneous compactions to allow, NOT including
|
|
|
-# validation "compactions" for anti-entropy repair. Simultaneous
|
|
|
-# compactions can help preserve read performance in a mixed read/write
|
|
|
-# workload, by mitigating the tendency of small sstables to accumulate
|
|
|
-# during a single long running compactions. The default is usually
|
|
|
-# fine and if you experience problems with compaction running too
|
|
|
-# slowly or too fast, you should look at
|
|
|
-# compaction_throughput_mb_per_sec first.
|
|
|
-#
|
|
|
-# concurrent_compactors defaults to the number of cores.
|
|
|
-# Uncomment to make compaction mono-threaded, the pre-0.8 default.
|
|
|
-#concurrent_compactors: 1
|
|
|
-
|
|
|
-# Multi-threaded compaction. When enabled, each compaction will use
|
|
|
-# up to one thread per core, plus one thread per sstable being merged.
|
|
|
-# This is usually only useful for SSD-based hardware: otherwise,
|
|
|
-# your concern is usually to get compaction to do LESS i/o (see:
|
|
|
-# compaction_throughput_mb_per_sec), not more.
|
|
|
-multithreaded_compaction: false
|
|
|
-
|
|
|
-# Throttles compaction to the given total throughput across the entire
|
|
|
-# system. The faster you insert data, the faster you need to compact in
|
|
|
-# order to keep the sstable count down, but in general, setting this to
|
|
|
-# 16 to 32 times the rate you are inserting data is more than sufficient.
|
|
|
-# Setting this to 0 disables throttling. Note that this account for all types
|
|
|
-# of compaction, including validation compaction.
|
|
|
-compaction_throughput_mb_per_sec: 16
|
|
|
-
|
|
|
-# Track cached row keys during compaction, and re-cache their new
|
|
|
-# positions in the compacted sstable. Disable if you use really large
|
|
|
-# key caches.
|
|
|
-compaction_preheat_key_cache: true
|
|
|
-
|
|
|
-# Throttles all outbound streaming file transfers on this node to the
|
|
|
-# given total throughput in Mbps. This is necessary because Cassandra does
|
|
|
-# mostly sequential IO when streaming data during bootstrap or repair, which
|
|
|
-# can lead to saturating the network connection and degrading rpc performance.
|
|
|
-# When unset, the default is 200 Mbps or 25 MB/s.
|
|
|
-# stream_throughput_outbound_megabits_per_sec: 200
|
|
|
-
|
|
|
-# How long the coordinator should wait for read operations to complete
|
|
|
-read_request_timeout_in_ms: 10000
|
|
|
-# How long the coordinator should wait for seq or index scans to complete
|
|
|
-range_request_timeout_in_ms: 10000
|
|
|
-# How long the coordinator should wait for writes to complete
|
|
|
-write_request_timeout_in_ms: 10000
|
|
|
-# How long the coordinator should wait for truncates to complete
|
|
|
-# (This can be much longer, because unless auto_snapshot is disabled
|
|
|
-# we need to flush first so we can snapshot before removing the data.)
|
|
|
-truncate_request_timeout_in_ms: 60000
|
|
|
-# The default timeout for other, miscellaneous operations
|
|
|
-request_timeout_in_ms: 10000
|
|
|
-
|
|
|
-# Enable operation timeout information exchange between nodes to accurately
|
|
|
-# measure request timeouts, If disabled cassandra will assuming the request
|
|
|
-# was forwarded to the replica instantly by the coordinator
|
|
|
-#
|
|
|
-# Warning: before enabling this property make sure to ntp is installed
|
|
|
-# and the times are synchronized between the nodes.
|
|
|
-cross_node_timeout: false
|
|
|
-
|
|
|
-# Enable socket timeout for streaming operation.
|
|
|
-# When a timeout occurs during streaming, streaming is retried from the start
|
|
|
-# of the current file. This _can_ involve re-streaming an important amount of
|
|
|
-# data, so you should avoid setting the value too low.
|
|
|
-# Default value is 0, which never timeout streams.
|
|
|
-# streaming_socket_timeout_in_ms: 0
|
|
|
-
|
|
|
-# phi value that must be reached for a host to be marked down.
|
|
|
-# most users should never need to adjust this.
|
|
|
-# phi_convict_threshold: 8
|
|
|
-
|
|
|
-# endpoint_snitch -- Set this to a class that implements
|
|
|
-# IEndpointSnitch. The snitch has two functions:
|
|
|
-# - it teaches Cassandra enough about your network topology to route
|
|
|
-# requests efficiently
|
|
|
-# - it allows Cassandra to spread replicas around your cluster to avoid
|
|
|
-# correlated failures. It does this by grouping machines into
|
|
|
-# "datacenters" and "racks." Cassandra will do its best not to have
|
|
|
-# more than one replica on the same "rack" (which may not actually
|
|
|
-# be a physical location)
|
|
|
-#
|
|
|
-# IF YOU CHANGE THE SNITCH AFTER DATA IS INSERTED INTO THE CLUSTER,
|
|
|
-# YOU MUST RUN A FULL REPAIR, SINCE THE SNITCH AFFECTS WHERE REPLICAS
|
|
|
-# ARE PLACED.
|
|
|
-#
|
|
|
-# Out of the box, Cassandra provides
|
|
|
-# - SimpleSnitch:
|
|
|
-# Treats Strategy order as proximity. This improves cache locality
|
|
|
-# when disabling read repair, which can further improve throughput.
|
|
|
-# Only appropriate for single-datacenter deployments.
|
|
|
-# - PropertyFileSnitch:
|
|
|
-# Proximity is determined by rack and data center, which are
|
|
|
-# explicitly configured in cassandra-topology.properties.
|
|
|
-# - GossipingPropertyFileSnitch
|
|
|
-# The rack and datacenter for the local node are defined in
|
|
|
-# cassandra-rackdc.properties and propagated to other nodes via gossip. If
|
|
|
-# cassandra-topology.properties exists, it is used as a fallback, allowing
|
|
|
-# migration from the PropertyFileSnitch.
|
|
|
-# - RackInferringSnitch:
|
|
|
-# Proximity is determined by rack and data center, which are
|
|
|
-# assumed to correspond to the 3rd and 2nd octet of each node's
|
|
|
-# IP address, respectively. Unless this happens to match your
|
|
|
-# deployment conventions (as it did Facebook's), this is best used
|
|
|
-# as an example of writing a custom Snitch class.
|
|
|
-# - Ec2Snitch:
|
|
|
-# Appropriate for EC2 deployments in a single Region. Loads Region
|
|
|
-# and Availability Zone information from the EC2 API. The Region is
|
|
|
-# treated as the datacenter, and the Availability Zone as the rack.
|
|
|
-# Only private IPs are used, so this will not work across multiple
|
|
|
-# Regions.
|
|
|
-# - Ec2MultiRegionSnitch:
|
|
|
-# Uses public IPs as broadcast_address to allow cross-region
|
|
|
-# connectivity. (Thus, you should set seed addresses to the public
|
|
|
-# IP as well.) You will need to open the storage_port or
|
|
|
-# ssl_storage_port on the public IP firewall. (For intra-Region
|
|
|
-# traffic, Cassandra will switch to the private IP after
|
|
|
-# establishing a connection.)
|
|
|
-#
|
|
|
-# You can use a custom Snitch by setting this to the full class name
|
|
|
-# of the snitch, which will be assumed to be on your classpath.
|
|
|
-endpoint_snitch: SimpleSnitch
|
|
|
-
|
|
|
-# controls how often to perform the more expensive part of host score
|
|
|
-# calculation
|
|
|
-dynamic_snitch_update_interval_in_ms: 100
|
|
|
-# controls how often to reset all host scores, allowing a bad host to
|
|
|
-# possibly recover
|
|
|
-dynamic_snitch_reset_interval_in_ms: 600000
|
|
|
-# if set greater than zero and read_repair_chance is < 1.0, this will allow
|
|
|
-# 'pinning' of replicas to hosts in order to increase cache capacity.
|
|
|
-# The badness threshold will control how much worse the pinned host has to be
|
|
|
-# before the dynamic snitch will prefer other replicas over it. This is
|
|
|
-# expressed as a double which represents a percentage. Thus, a value of
|
|
|
-# 0.2 means Cassandra would continue to prefer the static snitch values
|
|
|
-# until the pinned host was 20% worse than the fastest.
|
|
|
-dynamic_snitch_badness_threshold: 0.1
|
|
|
-
|
|
|
-# request_scheduler -- Set this to a class that implements
|
|
|
-# RequestScheduler, which will schedule incoming client requests
|
|
|
-# according to the specific policy. This is useful for multi-tenancy
|
|
|
-# with a single Cassandra cluster.
|
|
|
-# NOTE: This is specifically for requests from the client and does
|
|
|
-# not affect inter node communication.
|
|
|
-# org.apache.cassandra.scheduler.NoScheduler - No scheduling takes place
|
|
|
-# org.apache.cassandra.scheduler.RoundRobinScheduler - Round robin of
|
|
|
-# client requests to a node with a separate queue for each
|
|
|
-# request_scheduler_id. The scheduler is further customized by
|
|
|
-# request_scheduler_options as described below.
|
|
|
-request_scheduler: org.apache.cassandra.scheduler.NoScheduler
|
|
|
-
|
|
|
-# Scheduler Options vary based on the type of scheduler
|
|
|
-# NoScheduler - Has no options
|
|
|
-# RoundRobin
|
|
|
-# - throttle_limit -- The throttle_limit is the number of in-flight
|
|
|
-# requests per client. Requests beyond
|
|
|
-# that limit are queued up until
|
|
|
-# running requests can complete.
|
|
|
-# The value of 80 here is twice the number of
|
|
|
-# concurrent_reads + concurrent_writes.
|
|
|
-# - default_weight -- default_weight is optional and allows for
|
|
|
-# overriding the default which is 1.
|
|
|
-# - weights -- Weights are optional and will default to 1 or the
|
|
|
-# overridden default_weight. The weight translates into how
|
|
|
-# many requests are handled during each turn of the
|
|
|
-# RoundRobin, based on the scheduler id.
|
|
|
-#
|
|
|
-# request_scheduler_options:
|
|
|
-# throttle_limit: 80
|
|
|
-# default_weight: 5
|
|
|
-# weights:
|
|
|
-# Keyspace1: 1
|
|
|
-# Keyspace2: 5
|
|
|
-
|
|
|
-# request_scheduler_id -- An identifier based on which to perform
|
|
|
-# the request scheduling. Currently the only valid option is keyspace.
|
|
|
-# request_scheduler_id: keyspace
|
|
|
-
|
|
|
-# index_interval controls the sampling of entries from the primrary
|
|
|
-# row index in terms of space versus time. The larger the interval,
|
|
|
-# the smaller and less effective the sampling will be. In technicial
|
|
|
-# terms, the interval coresponds to the number of index entries that
|
|
|
-# are skipped between taking each sample. All the sampled entries
|
|
|
-# must fit in memory. Generally, a value between 128 and 512 here
|
|
|
-# coupled with a large key cache size on CFs results in the best trade
|
|
|
-# offs. This value is not often changed, however if you have many
|
|
|
-# very small rows (many to an OS page), then increasing this will
|
|
|
-# often lower memory usage without a impact on performance.
|
|
|
-index_interval: 128
|
|
|
-
|
|
|
-# Enable or disable inter-node encryption
|
|
|
-# Default settings are TLS v1, RSA 1024-bit keys (it is imperative that
|
|
|
-# users generate their own keys) TLS_RSA_WITH_AES_128_CBC_SHA as the cipher
|
|
|
-# suite for authentication, key exchange and encryption of the actual data transfers.
|
|
|
-# Use the DHE/ECDHE ciphers if running in FIPS 140 compliant mode.
|
|
|
-# NOTE: No custom encryption options are enabled at the moment
|
|
|
-# The available internode options are : all, none, dc, rack
|
|
|
-#
|
|
|
-# If set to dc cassandra will encrypt the traffic between the DCs
|
|
|
-# If set to rack cassandra will encrypt the traffic between the racks
|
|
|
-#
|
|
|
-# The passwords used in these options must match the passwords used when generating
|
|
|
-# the keystore and truststore. For instructions on generating these files, see:
|
|
|
-# http://download.oracle.com/javase/6/docs/technotes/guides/security/jsse/JSSERefGuide.html#CreateKeystore
|
|
|
-#
|
|
|
-server_encryption_options:
|
|
|
- internode_encryption: none
|
|
|
- keystore: conf/.keystore
|
|
|
- keystore_password: cassandra
|
|
|
- truststore: conf/.truststore
|
|
|
- truststore_password: cassandra
|
|
|
- # More advanced defaults below:
|
|
|
- # protocol: TLS
|
|
|
- # algorithm: SunX509
|
|
|
- # store_type: JKS
|
|
|
- # cipher_suites: [TLS_RSA_WITH_AES_128_CBC_SHA,TLS_RSA_WITH_AES_256_CBC_SHA,TLS_DHE_RSA_WITH_AES_128_CBC_SHA,TLS_DHE_RSA_WITH_AES_256_CBC_SHA,TLS_ECDHE_RSA_WITH_AES_128_CBC_SHA,TLS_ECDHE_RSA_WITH_AES_256_CBC_SHA]
|
|
|
- # require_client_auth: false
|
|
|
-
|
|
|
-# enable or disable client/server encryption.
|
|
|
-client_encryption_options:
|
|
|
- enabled: true
|
|
|
- keystore: testdata/pki/.keystore
|
|
|
- keystore_password: cassandra
|
|
|
- require_client_auth: true
|
|
|
- # Set trustore and truststore_password if require_client_auth is true
|
|
|
- truststore: testdata/pki/.truststore
|
|
|
- truststore_password: cassandra
|
|
|
- # More advanced defaults below:
|
|
|
- # protocol: TLS
|
|
|
- # algorithm: SunX509
|
|
|
- # store_type: JKS
|
|
|
-
|
|
|
-# internode_compression controls whether traffic between nodes is
|
|
|
-# compressed.
|
|
|
-# can be: all - all traffic is compressed
|
|
|
-# dc - traffic between different datacenters is compressed
|
|
|
-# none - nothing is compressed.
|
|
|
-internode_compression: all
|
|
|
-
|
|
|
-# Enable or disable tcp_nodelay for inter-dc communication.
|
|
|
-# Disabling it will result in larger (but fewer) network packets being sent,
|
|
|
-# reducing overhead from the TCP protocol itself, at the cost of increasing
|
|
|
-# latency if you block for cross-datacenter responses.
|
|
|
-inter_dc_tcp_nodelay: true
|