config.go 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256
  1. package sarama
  2. import (
  3. "crypto/tls"
  4. "time"
  5. )
  6. // Config is used to pass multiple configuration options to Sarama's constructors.
  7. type Config struct {
  8. // Net is the namespace for network-level properties used by the Broker, and shared by the Client/Producer/Consumer.
  9. Net struct {
  10. MaxOpenRequests int // How many outstanding requests a connection is allowed to have before sending on it blocks (default 5).
  11. // All three of the below configurations are similar to the `socket.timeout.ms` setting in JVM kafka.
  12. DialTimeout time.Duration // How long to wait for the initial connection to succeed before timing out and returning an error (default 30s).
  13. ReadTimeout time.Duration // How long to wait for a response before timing out and returning an error (default 30s).
  14. WriteTimeout time.Duration // How long to wait for a transmit to succeed before timing out and returning an error (default 30s).
  15. TLS struct {
  16. Enable bool // Whether or not to use TLS when connecting to the broker (defaults to false).
  17. Config *tls.Config // The TLS configuration to use for secure connections if enabled (defaults to nil).
  18. }
  19. }
  20. // Metadata is the namespace for metadata management properties used by the Client, and shared by the Producer/Consumer.
  21. Metadata struct {
  22. Retry struct {
  23. Max int // The total number of times to retry a metadata request when the cluster is in the middle of a leader election (default 3).
  24. Backoff time.Duration // How long to wait for leader election to occur before retrying (default 250ms). Similar to the JVM's `retry.backoff.ms`.
  25. }
  26. // How frequently to refresh the cluster metadata in the background. Defaults to 10 minutes.
  27. // Set to 0 to disable. Similar to `topic.metadata.refresh.interval.ms` in the JVM version.
  28. RefreshFrequency time.Duration
  29. }
  30. // Producer is the namespace for configuration related to producing messages, used by the Producer.
  31. Producer struct {
  32. // The maximum permitted size of a message (defaults to 1000000). Should be set equal to or smaller than the broker's `message.max.bytes`.
  33. MaxMessageBytes int
  34. // The level of acknowledgement reliability needed from the broker (defaults to WaitForLocal).
  35. // Equivalent to the `request.required.acks` setting of the JVM producer.
  36. RequiredAcks RequiredAcks
  37. // The maximum duration the broker will wait the receipt of the number of RequiredAcks (defaults to 10 seconds).
  38. // This is only relevant when RequiredAcks is set to WaitForAll or a number > 1. Only supports millisecond resolution,
  39. // nanoseconds will be truncated. Equivalent to the JVM producer's `request.timeout.ms` setting.
  40. Timeout time.Duration
  41. // The type of compression to use on messages (defaults to no compression). Similar to `compression.codec` setting of the JVM producer.
  42. Compression CompressionCodec
  43. // Generates partitioners for choosing the partition to send messages to (defaults to hashing the message key).
  44. // Similar to the `partitioner.class` setting for the JVM producer.
  45. Partitioner PartitionerConstructor
  46. // Return specifies what channels will be populated. If they are set to true, you must read from
  47. // the respective channels to prevent deadlock.
  48. Return struct {
  49. // If enabled, successfully delivered messages will be returned on the Successes channel (default disabled).
  50. Successes bool
  51. // If enabled, messages that failed to deliver will be returned on the Errors channel, including error (default enabled).
  52. Errors bool
  53. }
  54. // The following config options control how often messages are batched up and sent to the broker. By default,
  55. // messages are sent as fast as possible, and all messages received while the current batch is in-flight are placed
  56. // into the subsequent batch.
  57. Flush struct {
  58. Bytes int // The best-effort number of bytes needed to trigger a flush. Use the global sarama.MaxRequestSize to set a hard upper limit.
  59. Messages int // The best-effort number of messages needed to trigger a flush. Use `MaxMessages` to set a hard upper limit.
  60. Frequency time.Duration // The best-effort frequency of flushes. Equivalent to `queue.buffering.max.ms` setting of JVM producer.
  61. // The maximum number of messages the producer will send in a single broker request.
  62. // Defaults to 0 for unlimited. Similar to `queue.buffering.max.messages` in the JVM producer.
  63. MaxMessages int
  64. }
  65. Retry struct {
  66. // The total number of times to retry sending a message (default 3).
  67. // Similar to the `message.send.max.retries` setting of the JVM producer.
  68. Max int
  69. // How long to wait for the cluster to settle between retries (default 100ms).
  70. // Similar to the `retry.backoff.ms` setting of the JVM producer.
  71. Backoff time.Duration
  72. }
  73. }
  74. // Consumer is the namespace for configuration related to consuming messages, used by the Consumer.
  75. Consumer struct {
  76. Retry struct {
  77. // How long to wait after a failing to read from a partition before trying again (default 2s).
  78. Backoff time.Duration
  79. }
  80. // Fetch is the namespace for controlling how many bytes are retrieved by any given request.
  81. Fetch struct {
  82. // The minimum number of message bytes to fetch in a request - the broker will wait until at least this many are available.
  83. // The default is 1, as 0 causes the consumer to spin when no messages are available. Equivalent to the JVM's `fetch.min.bytes`.
  84. Min int32
  85. // The default number of message bytes to fetch from the broker in each request (default 32768). This should be larger than the
  86. // majority of your messages, or else the consumer will spend a lot of time negotiating sizes and not actually consuming. Similar
  87. // to the JVM's `fetch.message.max.bytes`.
  88. Default int32
  89. // The maximum number of message bytes to fetch from the broker in a single request. Messages larger than this will return
  90. // ErrMessageTooLarge and will not be consumable, so you must be sure this is at least as large as your largest message.
  91. // Defaults to 0 (no limit). Similar to the JVM's `fetch.message.max.bytes`. The global `sarama.MaxResponseSize` still applies.
  92. Max int32
  93. }
  94. // The maximum amount of time the broker will wait for Consumer.Fetch.Min bytes to become available before it
  95. // returns fewer than that anyways. The default is 250ms, since 0 causes the consumer to spin when no events are available.
  96. // 100-500ms is a reasonable range for most cases. Kafka only supports precision up to milliseconds; nanoseconds will be truncated.
  97. // Equivalent to the JVM's `fetch.wait.max.ms`.
  98. MaxWaitTime time.Duration
  99. // Return specifies what channels will be populated. If they are set to true, you must read from
  100. // them to prevent deadlock.
  101. Return struct {
  102. // If enabled, any errors that occured while consuming are returned on the Errors channel (default disabled).
  103. Errors bool
  104. }
  105. }
  106. // A user-provided string sent with every request to the brokers for logging, debugging, and auditing purposes.
  107. // Defaults to "sarama", but you should probably set it to something specific to your application.
  108. ClientID string
  109. // The number of events to buffer in internal and external channels. This permits the producer and consumer to
  110. // continue processing some messages in the background while user code is working, greatly improving throughput.
  111. // Defaults to 256.
  112. ChannelBufferSize int
  113. }
  114. // NewConfig returns a new configuration instance with sane defaults.
  115. func NewConfig() *Config {
  116. c := &Config{}
  117. c.Net.MaxOpenRequests = 5
  118. c.Net.DialTimeout = 30 * time.Second
  119. c.Net.ReadTimeout = 30 * time.Second
  120. c.Net.WriteTimeout = 30 * time.Second
  121. c.Metadata.Retry.Max = 3
  122. c.Metadata.Retry.Backoff = 250 * time.Millisecond
  123. c.Metadata.RefreshFrequency = 10 * time.Minute
  124. c.Producer.MaxMessageBytes = 1000000
  125. c.Producer.RequiredAcks = WaitForLocal
  126. c.Producer.Timeout = 10 * time.Second
  127. c.Producer.Partitioner = NewHashPartitioner
  128. c.Producer.Retry.Max = 3
  129. c.Producer.Retry.Backoff = 100 * time.Millisecond
  130. c.Producer.Return.Errors = true
  131. c.Consumer.Fetch.Min = 1
  132. c.Consumer.Fetch.Default = 32768
  133. c.Consumer.Retry.Backoff = 2 * time.Second
  134. c.Consumer.MaxWaitTime = 250 * time.Millisecond
  135. c.Consumer.Return.Errors = false
  136. c.ChannelBufferSize = 256
  137. return c
  138. }
  139. // Validate checks a Config instance. It will return a
  140. // ConfigurationError if the specified values don't make sense.
  141. func (c *Config) Validate() error {
  142. // some configuration values should be warned on but not fail completely, do those first
  143. if c.Producer.RequiredAcks > 1 {
  144. Logger.Println("Producer.RequiredAcks > 1 is deprecated and will raise an exception with kafka >= 0.8.2.0.")
  145. }
  146. if c.Producer.MaxMessageBytes >= forceFlushThreshold() {
  147. Logger.Println("Producer.MaxMessageBytes is too close to MaxRequestSize; it will be ignored.")
  148. }
  149. if c.Producer.Flush.Bytes >= forceFlushThreshold() {
  150. Logger.Println("Producer.Flush.Bytes is too close to MaxRequestSize; it will be ignored.")
  151. }
  152. if c.Producer.Timeout%time.Millisecond != 0 {
  153. Logger.Println("Producer.Timeout only supports millisecond resolution; nanoseconds will be truncated.")
  154. }
  155. if c.Consumer.MaxWaitTime < 100*time.Millisecond {
  156. Logger.Println("Consumer.MaxWaitTime is very low, which can cause high CPU and network usage. See documentation for details.")
  157. }
  158. if c.Consumer.MaxWaitTime%time.Millisecond != 0 {
  159. Logger.Println("Consumer.MaxWaitTime only supports millisecond precision; nanoseconds will be truncated.")
  160. }
  161. if c.ClientID == "sarama" {
  162. Logger.Println("ClientID is the default of 'sarama', you should consider setting it to something application-specific.")
  163. }
  164. // validate Net values
  165. switch {
  166. case c.Net.MaxOpenRequests <= 0:
  167. return ConfigurationError("Invalid Net.MaxOpenRequests, must be > 0")
  168. case c.Net.DialTimeout <= 0:
  169. return ConfigurationError("Invalid Net.DialTimeout, must be > 0")
  170. case c.Net.ReadTimeout <= 0:
  171. return ConfigurationError("Invalid Net.ReadTimeout, must be > 0")
  172. case c.Net.WriteTimeout <= 0:
  173. return ConfigurationError("Invalid Net.WriteTimeout, must be > 0")
  174. }
  175. // validate the Metadata values
  176. switch {
  177. case c.Metadata.Retry.Max < 0:
  178. return ConfigurationError("Invalid Metadata.Retry.Max, must be >= 0")
  179. case c.Metadata.Retry.Backoff < 0:
  180. return ConfigurationError("Invalid Metadata.Retry.Backoff, must be >= 0")
  181. case c.Metadata.RefreshFrequency < 0:
  182. return ConfigurationError("Invalid Metadata.RefreshFrequency, must be >= 0")
  183. }
  184. // validate the Producer values
  185. switch {
  186. case c.Producer.MaxMessageBytes <= 0:
  187. return ConfigurationError("Invalid Producer.MaxMessageBytes, must be > 0")
  188. case c.Producer.RequiredAcks < -1:
  189. return ConfigurationError("Invalid Producer.RequiredAcks, must be >= -1")
  190. case c.Producer.Timeout <= 0:
  191. return ConfigurationError("Invalid Producer.Timeout, must be > 0")
  192. case c.Producer.Partitioner == nil:
  193. return ConfigurationError("Invalid Producer.Partitioner, must not be nil")
  194. case c.Producer.Flush.Bytes < 0:
  195. return ConfigurationError("Invalid Producer.Flush.Bytes, must be >= 0")
  196. case c.Producer.Flush.Messages < 0:
  197. return ConfigurationError("Invalid Producer.Flush.Messages, must be >= 0")
  198. case c.Producer.Flush.Frequency < 0:
  199. return ConfigurationError("Invalid Producer.Flush.Frequency, must be >= 0")
  200. case c.Producer.Flush.MaxMessages < 0:
  201. return ConfigurationError("Invalid Producer.Flush.MaxMessages, must be >= 0")
  202. case c.Producer.Flush.MaxMessages > 0 && c.Producer.Flush.MaxMessages < c.Producer.Flush.Messages:
  203. return ConfigurationError("Invalid Producer.Flush.MaxMessages, must be >= Producer.Flush.Messages when set")
  204. case c.Producer.Retry.Max < 0:
  205. return ConfigurationError("Invalid Producer.Retry.Max, must be >= 0")
  206. case c.Producer.Retry.Backoff < 0:
  207. return ConfigurationError("Invalid Producer.Retry.Backoff, must be >= 0")
  208. }
  209. // validate the Consumer values
  210. switch {
  211. case c.Consumer.Fetch.Min <= 0:
  212. return ConfigurationError("Invalid Consumer.Fetch.Min, must be > 0")
  213. case c.Consumer.Fetch.Default <= 0:
  214. return ConfigurationError("Invalid Consumer.Fetch.Default, must be > 0")
  215. case c.Consumer.Fetch.Max < 0:
  216. return ConfigurationError("Invalid Consumer.Fetch.Max, must be >= 0")
  217. case c.Consumer.MaxWaitTime < 1*time.Millisecond:
  218. return ConfigurationError("Invalid Consumer.MaxWaitTime, must be > 1ms")
  219. case c.Consumer.Retry.Backoff < 0:
  220. return ConfigurationError("Invalid Consumer.Retry.Backoff, must be >= 0")
  221. }
  222. // validate misc shared values
  223. switch {
  224. case c.ChannelBufferSize < 0:
  225. return ConfigurationError("Invalid ChannelBufferSize, must be >= 0")
  226. }
  227. return nil
  228. }