package sarama

import (
	"compress/gzip"
	"crypto/tls"
	"fmt"
	"io/ioutil"
	"net"
	"regexp"
	"time"

	"github.com/rcrowley/go-metrics"
)

const defaultClientID = "sarama"

var validID = regexp.MustCompile(`\A[A-Za-z0-9._-]+\z`)

// Config is used to pass multiple configuration options to Sarama's constructors.
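//
// A minimal usage sketch (defaults come from NewConfig below; the client ID
// shown is only an illustrative placeholder):
//
//	cfg := NewConfig()
//	cfg.ClientID = "my-application"
//	if err := cfg.Validate(); err != nil {
//		panic(err)
//	}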
type Config struct {
	// Admin is the namespace for ClusterAdmin properties used by the administrative Kafka client.
	Admin struct {
		// The maximum duration the administrative Kafka client will wait for ClusterAdmin operations,
		// including topics, brokers, configurations and ACLs (defaults to 3 seconds).
		Timeout time.Duration
	}

	// Net is the namespace for network-level properties used by the Broker, and
	// shared by the Client/Producer/Consumer.
	Net struct {
		// How many outstanding requests a connection is allowed to have before
		// sending on it blocks (default 5).
		MaxOpenRequests int

		// All three of the below configurations are similar to the
		// `socket.timeout.ms` setting in the JVM Kafka client. All of them
		// default to 30 seconds.
		DialTimeout  time.Duration // How long to wait for the initial connection.
		ReadTimeout  time.Duration // How long to wait for a response.
		WriteTimeout time.Duration // How long to wait for a transmit.

		TLS struct {
			// Whether or not to use TLS when connecting to the broker
			// (defaults to false).
			Enable bool
			// The TLS configuration to use for secure connections if
			// enabled (defaults to nil).
			Config *tls.Config
		}
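
		// A TLS sketch (certificate loading is elided; the tls.Config shown
		// is only illustrative, not a security recommendation):
		//
		//	cfg.Net.TLS.Enable = true
		//	cfg.Net.TLS.Config = &tls.Config{MinVersion: tls.VersionTLS12}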

		// SASL based authentication with broker. While there are multiple SASL
		// authentication methods, the current implementation is limited to
		// plaintext (SASL/PLAIN) authentication.
		SASL struct {
			// Whether or not to use SASL authentication when connecting to the broker
			// (defaults to false).
			Enable bool
			// Whether or not to send the Kafka SASL handshake first if enabled
			// (defaults to true). You should only set this to false if you're using
			// a non-Kafka SASL proxy.
			Handshake bool
			// Username and password for SASL/PLAIN authentication.
			User     string
			Password string
		}
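
		// A SASL/PLAIN sketch (placeholder credentials; enabling TLS as well
		// is advisable since the password is otherwise sent in the clear):
		//
		//	cfg.Net.SASL.Enable = true
		//	cfg.Net.SASL.User = "alice"
		//	cfg.Net.SASL.Password = "secret"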

		// KeepAlive specifies the keep-alive period for an active network connection.
		// If zero, keep-alives are disabled (default is 0: disabled).
		KeepAlive time.Duration

		// LocalAddr is the local address to use when dialing an
		// address. The address must be of a compatible type for the
		// network being dialed.
		// If nil, a local address is automatically chosen.
		LocalAddr net.Addr
	}

	// Metadata is the namespace for metadata management properties used by the
	// Client, and shared by the Producer/Consumer.
	Metadata struct {
		Retry struct {
			// The total number of times to retry a metadata request when the
			// cluster is in the middle of a leader election (default 3).
			Max int
			// How long to wait for leader election to occur before retrying
			// (default 250ms). Similar to the JVM's `retry.backoff.ms`.
			Backoff time.Duration
		}
		// How frequently to refresh the cluster metadata in the background.
		// Defaults to 10 minutes. Set to 0 to disable. Similar to
		// `topic.metadata.refresh.interval.ms` in the JVM version.
		RefreshFrequency time.Duration

		// Whether to maintain a full set of metadata for all topics, or just
		// the minimal set that has been necessary so far. The full set is simpler
		// and usually more convenient, but can take up a substantial amount of
		// memory if you have many topics and partitions. Defaults to true.
		Full bool
	}
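
	// A metadata tuning sketch (illustrative values; Full = false trades the
	// convenience described above for lower memory use on clusters with very
	// many topics):
	//
	//	cfg.Metadata.Full = false
	//	cfg.Metadata.RefreshFrequency = 5 * time.Minute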

	// Producer is the namespace for configuration related to producing messages,
	// used by the Producer.
	Producer struct {
		// The maximum permitted size of a message (defaults to 1000000). Should be
		// set equal to or smaller than the broker's `message.max.bytes`.
		MaxMessageBytes int
		// The level of acknowledgement reliability needed from the broker (defaults
		// to WaitForLocal). Equivalent to the `request.required.acks` setting of the
		// JVM producer.
		RequiredAcks RequiredAcks
		// The maximum duration the broker will wait for the receipt of the number of
		// RequiredAcks (defaults to 10 seconds). This is only relevant when
		// RequiredAcks is set to WaitForAll or a number > 1. Only supports
		// millisecond resolution; nanoseconds will be truncated. Equivalent to
		// the JVM producer's `request.timeout.ms` setting.
		Timeout time.Duration
		// The type of compression to use on messages (defaults to no compression).
		// Similar to the `compression.codec` setting of the JVM producer.
		Compression CompressionCodec
		// The level of compression to use on messages. The meaning depends
		// on the actual compression type used, and defaults to the default
		// compression level for the codec.
		CompressionLevel int
		// Generates partitioners for choosing the partition to send messages to
		// (defaults to hashing the message key). Similar to the `partitioner.class`
		// setting for the JVM producer.
		Partitioner PartitionerConstructor

		// Return specifies which channels will be populated. If they are set to true,
		// you must read from the respective channels to prevent deadlock. If,
		// however, this config is used to create a `SyncProducer`, both must be set
		// to true and you must not read from the channels since the producer does
		// this internally.
		Return struct {
			// If enabled, successfully delivered messages will be returned on the
			// Successes channel (default disabled).
			Successes bool

			// If enabled, messages that failed to deliver will be returned on the
			// Errors channel, including the associated error (default enabled).
			Errors bool
		}
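
		// A sketch of the SyncProducer rule above: both channels enabled and
		// read internally by the producer (the broker address is a placeholder):
		//
		//	cfg.Producer.Return.Successes = true
		//	cfg.Producer.Return.Errors = true
		//	producer, err := NewSyncProducer([]string{"localhost:9092"}, cfg)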

		// The following config options control how often messages are batched up and
		// sent to the broker. By default, messages are sent as fast as possible, and
		// all messages received while the current batch is in-flight are placed
		// into the subsequent batch.
		Flush struct {
			// The best-effort number of bytes needed to trigger a flush. Use the
			// global sarama.MaxRequestSize to set a hard upper limit.
			Bytes int
			// The best-effort number of messages needed to trigger a flush. Use
			// `MaxMessages` to set a hard upper limit.
			Messages int
			// The best-effort frequency of flushes. Equivalent to the
			// `queue.buffering.max.ms` setting of the JVM producer.
			Frequency time.Duration
			// The maximum number of messages the producer will send in a single
			// broker request. Defaults to 0 for unlimited. Similar to
			// `queue.buffering.max.messages` in the JVM producer.
			MaxMessages int
		}
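
		// A batching sketch (illustrative values; whichever best-effort
		// trigger is reached first causes the flush):
		//
		//	cfg.Producer.Flush.Frequency = 500 * time.Millisecond
		//	cfg.Producer.Flush.Messages = 100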

		Retry struct {
			// The total number of times to retry sending a message (default 3).
			// Similar to the `message.send.max.retries` setting of the JVM producer.
			Max int
			// How long to wait for the cluster to settle between retries
			// (default 100ms). Similar to the `retry.backoff.ms` setting of the
			// JVM producer.
			Backoff time.Duration
		}
	}

	// Consumer is the namespace for configuration related to consuming messages,
	// used by the Consumer.
	//
	// Note that Sarama's Consumer type does not currently support automatic
	// consumer-group rebalancing and offset tracking. For Zookeeper-based
	// tracking (Kafka 0.8.2 and earlier), the https://github.com/wvanbergen/kafka
	// library builds on Sarama to add this support. For Kafka-based tracking
	// (Kafka 0.9 and later), the https://github.com/bsm/sarama-cluster library
	// builds on Sarama to add this support.
	Consumer struct {
		Retry struct {
			// How long to wait after failing to read from a partition before
			// trying again (default 2s).
			Backoff time.Duration
		}

		// Fetch is the namespace for controlling how many bytes are retrieved by any
		// given request.
		Fetch struct {
			// The minimum number of message bytes to fetch in a request - the broker
			// will wait until at least this many are available. The default is 1,
			// as 0 causes the consumer to spin when no messages are available.
			// Equivalent to the JVM's `fetch.min.bytes`.
			Min int32
			// The default number of message bytes to fetch from the broker in each
			// request (default 1MB). This should be larger than the majority of
			// your messages, or else the consumer will spend a lot of time
			// negotiating sizes and not actually consuming. Similar to the JVM's
			// `fetch.message.max.bytes`.
			Default int32
			// The maximum number of message bytes to fetch from the broker in a
			// single request. Messages larger than this will return
			// ErrMessageTooLarge and will not be consumable, so you must be sure
			// this is at least as large as your largest message. Defaults to 0
			// (no limit). Similar to the JVM's `fetch.message.max.bytes`. The
			// global `sarama.MaxResponseSize` still applies.
			Max int32
		}
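
		// A fetch-sizing sketch (illustrative values, not recommendations):
		//
		//	cfg.Consumer.Fetch.Default = 10 * 1024 * 1024 // most messages fit
		//	cfg.Consumer.Fetch.Max = 32 * 1024 * 1024     // hard per-request cap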

		// The maximum amount of time the broker will wait for Consumer.Fetch.Min
		// bytes to become available before it returns fewer than that anyway. The
		// default is 250ms, since 0 causes the consumer to spin when no events are
		// available. 100-500ms is a reasonable range for most cases. Kafka only
		// supports precision up to milliseconds; nanoseconds will be truncated.
		// Equivalent to the JVM's `fetch.wait.max.ms`.
		MaxWaitTime time.Duration

		// The maximum amount of time the consumer expects a message to take to
		// process for the user. If writing to the Messages channel takes longer
		// than this, that partition will stop fetching more messages until it
		// can proceed again.
		// Note that, since the Messages channel is buffered, the actual grace time is
		// (MaxProcessingTime * ChannelBufferSize). Defaults to 100ms.
		// If a message is not written to the Messages channel between two ticks
		// of the expiryTicker then a timeout is detected.
		// Using a ticker instead of a timer to detect timeouts should typically
		// result in many fewer calls to Timer functions, which may result in a
		// significant performance improvement if many messages are being sent
		// and timeouts are infrequent.
		// The disadvantage of using a ticker instead of a timer is that
		// timeouts will be less accurate. That is, the effective timeout could
		// be between `MaxProcessingTime` and `2 * MaxProcessingTime`. For
		// example, if `MaxProcessingTime` is 100ms then a delay of 180ms
		// between two messages being sent may not be recognized as a timeout.
		MaxProcessingTime time.Duration

		// Return specifies which channels will be populated. If they are set to true,
		// you must read from them to prevent deadlock.
		Return struct {
			// If enabled, any errors that occurred while consuming are returned on
			// the Errors channel (default disabled).
			Errors bool
		}
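
		// A sketch of draining the Errors channel when enabled (pc is assumed
		// to be a PartitionConsumer obtained elsewhere; log import assumed):
		//
		//	cfg.Consumer.Return.Errors = true
		//	go func() {
		//		for err := range pc.Errors() {
		//			log.Println(err)
		//		}
		//	}()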

		// Offsets specifies configuration for how and when to commit consumed
		// offsets. This currently requires the manual use of an OffsetManager
		// but will eventually be automated.
		Offsets struct {
			// How frequently to commit updated offsets. Defaults to 1s.
			CommitInterval time.Duration

			// The initial offset to use if no offset was previously committed.
			// Should be OffsetNewest or OffsetOldest. Defaults to OffsetNewest.
			Initial int64

			// The retention duration for committed offsets. If zero, disabled
			// (in which case the `offsets.retention.minutes` option on the
			// broker will be used). Kafka only supports precision up to
			// milliseconds; nanoseconds will be truncated. Requires Kafka
			// broker version 0.9.0 or later.
			// (default is 0: disabled).
			Retention time.Duration

			Retry struct {
				// The total number of times to retry failing commit
				// requests during OffsetManager shutdown (default 3).
				Max int
			}
		}
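
		// An offsets sketch (start from the oldest available message and
		// retain commits for 7 days; Retention requires broker >= 0.9.0):
		//
		//	cfg.Consumer.Offsets.Initial = OffsetOldest
		//	cfg.Consumer.Offsets.Retention = 7 * 24 * time.Hour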
	}

	// A user-provided string sent with every request to the brokers for logging,
	// debugging, and auditing purposes. Defaults to "sarama", but you should
	// probably set it to something specific to your application.
	ClientID string
	// The number of events to buffer in internal and external channels. This
	// permits the producer and consumer to continue processing some messages
	// in the background while user code is working, greatly improving throughput.
	// Defaults to 256.
	ChannelBufferSize int
	// The version of Kafka that Sarama will assume it is running against.
	// Defaults to the oldest supported stable version. Since Kafka provides
	// backwards-compatibility, setting it to a version older than you have
	// will not break anything, although it may prevent you from using the
	// latest features. Setting it to a version greater than you are actually
	// running may lead to random breakage.
	Version KafkaVersion
	// The registry to define metrics into.
	// Defaults to a local registry.
	// If you want to disable metrics gathering, set metrics.UseNilMetrics to true
	// prior to starting Sarama.
	// See the examples for how to use the metrics registry.
	MetricRegistry metrics.Registry
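
	// A sketch of disabling metrics gathering via go-metrics, per the note
	// above (must happen before any Sarama objects are created):
	//
	//	metrics.UseNilMetrics = true
	//	cfg := NewConfig() // metric updates become no-ops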
}

// NewConfig returns a new configuration instance with sane defaults.
func NewConfig() *Config {
	c := &Config{}

	c.Admin.Timeout = 3 * time.Second

	c.Net.MaxOpenRequests = 5
	c.Net.DialTimeout = 30 * time.Second
	c.Net.ReadTimeout = 30 * time.Second
	c.Net.WriteTimeout = 30 * time.Second
	c.Net.SASL.Handshake = true

	c.Metadata.Retry.Max = 3
	c.Metadata.Retry.Backoff = 250 * time.Millisecond
	c.Metadata.RefreshFrequency = 10 * time.Minute
	c.Metadata.Full = true

	c.Producer.MaxMessageBytes = 1000000
	c.Producer.RequiredAcks = WaitForLocal
	c.Producer.Timeout = 10 * time.Second
	c.Producer.Partitioner = NewHashPartitioner
	c.Producer.Retry.Max = 3
	c.Producer.Retry.Backoff = 100 * time.Millisecond
	c.Producer.Return.Errors = true
	c.Producer.CompressionLevel = CompressionLevelDefault

	c.Consumer.Fetch.Min = 1
	c.Consumer.Fetch.Default = 1024 * 1024
	c.Consumer.Retry.Backoff = 2 * time.Second
	c.Consumer.MaxWaitTime = 250 * time.Millisecond
	c.Consumer.MaxProcessingTime = 100 * time.Millisecond
	c.Consumer.Return.Errors = false
	c.Consumer.Offsets.CommitInterval = 1 * time.Second
	c.Consumer.Offsets.Initial = OffsetNewest
	c.Consumer.Offsets.Retry.Max = 3

	c.ClientID = defaultClientID
	c.ChannelBufferSize = 256
	c.Version = MinVersion
	c.MetricRegistry = metrics.NewRegistry()

	return c
}
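// As a sketch, defaults can be adjusted after NewConfig and then checked with
// Validate; for example, lz4 compression needs the Kafka version raised first
// (see the version check in Validate below):
//
//	cfg := NewConfig()
//	cfg.Version = V0_10_0_0
//	cfg.Producer.Compression = CompressionLZ4
//	err := cfg.Validate()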

// Validate checks a Config instance. It will return a
// ConfigurationError if the specified values don't make sense.
func (c *Config) Validate() error {
	// some configuration values should be warned on but not fail completely, do those first
	if !c.Net.TLS.Enable && c.Net.TLS.Config != nil {
		Logger.Println("Net.TLS is disabled but a non-nil configuration was provided.")
	}
	if !c.Net.SASL.Enable {
		if c.Net.SASL.User != "" {
			Logger.Println("Net.SASL is disabled but a non-empty username was provided.")
		}
		if c.Net.SASL.Password != "" {
			Logger.Println("Net.SASL is disabled but a non-empty password was provided.")
		}
	}
	if c.Producer.RequiredAcks > 1 {
		Logger.Println("Producer.RequiredAcks > 1 is deprecated and will raise an exception with kafka >= 0.8.2.0.")
	}
	if c.Producer.MaxMessageBytes >= int(MaxRequestSize) {
		Logger.Println("Producer.MaxMessageBytes must be smaller than MaxRequestSize; it will be ignored.")
	}
	if c.Producer.Flush.Bytes >= int(MaxRequestSize) {
		Logger.Println("Producer.Flush.Bytes must be smaller than MaxRequestSize; it will be ignored.")
	}
	if (c.Producer.Flush.Bytes > 0 || c.Producer.Flush.Messages > 0) && c.Producer.Flush.Frequency == 0 {
		Logger.Println("Producer.Flush: Bytes or Messages are set, but Frequency is not; messages may not get flushed.")
	}
	if c.Producer.Timeout%time.Millisecond != 0 {
		Logger.Println("Producer.Timeout only supports millisecond resolution; nanoseconds will be truncated.")
	}
	if c.Consumer.MaxWaitTime < 100*time.Millisecond {
		Logger.Println("Consumer.MaxWaitTime is very low, which can cause high CPU and network usage. See documentation for details.")
	}
	if c.Consumer.MaxWaitTime%time.Millisecond != 0 {
		Logger.Println("Consumer.MaxWaitTime only supports millisecond precision; nanoseconds will be truncated.")
	}
	if c.Consumer.Offsets.Retention%time.Millisecond != 0 {
		Logger.Println("Consumer.Offsets.Retention only supports millisecond precision; nanoseconds will be truncated.")
	}
	if c.ClientID == defaultClientID {
		Logger.Println("ClientID is the default of 'sarama', you should consider setting it to something application-specific.")
	}

	// validate Net values
	switch {
	case c.Net.MaxOpenRequests <= 0:
		return ConfigurationError("Net.MaxOpenRequests must be > 0")
	case c.Net.DialTimeout <= 0:
		return ConfigurationError("Net.DialTimeout must be > 0")
	case c.Net.ReadTimeout <= 0:
		return ConfigurationError("Net.ReadTimeout must be > 0")
	case c.Net.WriteTimeout <= 0:
		return ConfigurationError("Net.WriteTimeout must be > 0")
	case c.Net.KeepAlive < 0:
		return ConfigurationError("Net.KeepAlive must be >= 0")
	case c.Net.SASL.Enable && c.Net.SASL.User == "":
		return ConfigurationError("Net.SASL.User must not be empty when SASL is enabled")
	case c.Net.SASL.Enable && c.Net.SASL.Password == "":
		return ConfigurationError("Net.SASL.Password must not be empty when SASL is enabled")
	}

	// validate the Admin values
	switch {
	case c.Admin.Timeout <= 0:
		return ConfigurationError("Admin.Timeout must be > 0")
	}

	// validate the Metadata values
	switch {
	case c.Metadata.Retry.Max < 0:
		return ConfigurationError("Metadata.Retry.Max must be >= 0")
	case c.Metadata.Retry.Backoff < 0:
		return ConfigurationError("Metadata.Retry.Backoff must be >= 0")
	case c.Metadata.RefreshFrequency < 0:
		return ConfigurationError("Metadata.RefreshFrequency must be >= 0")
	}

	// validate the Producer values
	switch {
	case c.Producer.MaxMessageBytes <= 0:
		return ConfigurationError("Producer.MaxMessageBytes must be > 0")
	case c.Producer.RequiredAcks < -1:
		return ConfigurationError("Producer.RequiredAcks must be >= -1")
	case c.Producer.Timeout <= 0:
		return ConfigurationError("Producer.Timeout must be > 0")
	case c.Producer.Partitioner == nil:
		return ConfigurationError("Producer.Partitioner must not be nil")
	case c.Producer.Flush.Bytes < 0:
		return ConfigurationError("Producer.Flush.Bytes must be >= 0")
	case c.Producer.Flush.Messages < 0:
		return ConfigurationError("Producer.Flush.Messages must be >= 0")
	case c.Producer.Flush.Frequency < 0:
		return ConfigurationError("Producer.Flush.Frequency must be >= 0")
	case c.Producer.Flush.MaxMessages < 0:
		return ConfigurationError("Producer.Flush.MaxMessages must be >= 0")
	case c.Producer.Flush.MaxMessages > 0 && c.Producer.Flush.MaxMessages < c.Producer.Flush.Messages:
		return ConfigurationError("Producer.Flush.MaxMessages must be >= Producer.Flush.Messages when set")
	case c.Producer.Retry.Max < 0:
		return ConfigurationError("Producer.Retry.Max must be >= 0")
	case c.Producer.Retry.Backoff < 0:
		return ConfigurationError("Producer.Retry.Backoff must be >= 0")
	}

	if c.Producer.Compression == CompressionLZ4 && !c.Version.IsAtLeast(V0_10_0_0) {
		return ConfigurationError("lz4 compression requires Version >= V0_10_0_0")
	}

	if c.Producer.Compression == CompressionGZIP {
		if c.Producer.CompressionLevel != CompressionLevelDefault {
			if _, err := gzip.NewWriterLevel(ioutil.Discard, c.Producer.CompressionLevel); err != nil {
				return ConfigurationError(fmt.Sprintf("gzip compression does not work with level %d: %v", c.Producer.CompressionLevel, err))
			}
		}
	}

	// validate the Consumer values
	switch {
	case c.Consumer.Fetch.Min <= 0:
		return ConfigurationError("Consumer.Fetch.Min must be > 0")
	case c.Consumer.Fetch.Default <= 0:
		return ConfigurationError("Consumer.Fetch.Default must be > 0")
	case c.Consumer.Fetch.Max < 0:
		return ConfigurationError("Consumer.Fetch.Max must be >= 0")
	case c.Consumer.MaxWaitTime < 1*time.Millisecond:
		return ConfigurationError("Consumer.MaxWaitTime must be >= 1ms")
	case c.Consumer.MaxProcessingTime <= 0:
		return ConfigurationError("Consumer.MaxProcessingTime must be > 0")
	case c.Consumer.Retry.Backoff < 0:
		return ConfigurationError("Consumer.Retry.Backoff must be >= 0")
	case c.Consumer.Offsets.CommitInterval <= 0:
		return ConfigurationError("Consumer.Offsets.CommitInterval must be > 0")
	case c.Consumer.Offsets.Initial != OffsetOldest && c.Consumer.Offsets.Initial != OffsetNewest:
		return ConfigurationError("Consumer.Offsets.Initial must be OffsetOldest or OffsetNewest")
	case c.Consumer.Offsets.Retry.Max < 0:
		return ConfigurationError("Consumer.Offsets.Retry.Max must be >= 0")
	}

	// validate misc shared values
	switch {
	case c.ChannelBufferSize < 0:
		return ConfigurationError("ChannelBufferSize must be >= 0")
	case !validID.MatchString(c.ClientID):
		return ConfigurationError("ClientID is invalid")
	}

	return nil
}