2015-06-27 03:56:14 +00:00
|
|
|
package kafka_consumer
|
|
|
|
|
|
|
|
import (
|
2016-02-06 00:36:35 +00:00
|
|
|
"fmt"
|
2015-11-16 20:12:45 +00:00
|
|
|
"log"
|
|
|
|
"strings"
|
|
|
|
"sync"
|
2015-06-27 03:56:14 +00:00
|
|
|
|
2016-01-27 21:21:36 +00:00
|
|
|
"github.com/influxdata/telegraf"
|
2016-01-20 18:57:35 +00:00
|
|
|
"github.com/influxdata/telegraf/plugins/inputs"
|
2016-02-06 00:36:35 +00:00
|
|
|
"github.com/influxdata/telegraf/plugins/parsers"
|
2015-11-16 20:12:45 +00:00
|
|
|
|
|
|
|
"github.com/Shopify/sarama"
|
2015-06-27 03:56:14 +00:00
|
|
|
"github.com/wvanbergen/kafka/consumergroup"
|
|
|
|
)
|
|
|
|
|
|
|
|
type Kafka struct {
|
2015-11-16 20:12:45 +00:00
|
|
|
ConsumerGroup string
|
|
|
|
Topics []string
|
|
|
|
ZookeeperPeers []string
|
|
|
|
Consumer *consumergroup.ConsumerGroup
|
2016-02-09 22:03:46 +00:00
|
|
|
MetricBuffer int
|
|
|
|
// TODO remove PointBuffer, legacy support
|
|
|
|
PointBuffer int
|
|
|
|
Offset string
|
2015-11-16 20:12:45 +00:00
|
|
|
|
2016-02-06 00:36:35 +00:00
|
|
|
parser parsers.Parser
|
|
|
|
|
2015-11-16 20:12:45 +00:00
|
|
|
sync.Mutex
|
|
|
|
|
|
|
|
// channel for all incoming kafka messages
|
|
|
|
in <-chan *sarama.ConsumerMessage
|
|
|
|
// channel for all kafka consumer errors
|
|
|
|
errs <-chan *sarama.ConsumerError
|
2016-02-09 22:03:46 +00:00
|
|
|
// channel for all incoming parsed kafka metrics
|
2016-01-27 23:15:14 +00:00
|
|
|
metricC chan telegraf.Metric
|
|
|
|
done chan struct{}
|
2015-11-16 20:12:45 +00:00
|
|
|
|
|
|
|
// doNotCommitMsgs tells the parser not to call CommitUpTo on the consumer
|
|
|
|
// this is mostly for test purposes, but there may be a use-case for it later.
|
|
|
|
doNotCommitMsgs bool
|
2015-06-27 03:56:14 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// sampleConfig is the example configuration text returned by SampleConfig.
var sampleConfig = `
### topic(s) to consume
topics = ["telegraf"]
### an array of Zookeeper connection strings
zookeeper_peers = ["localhost:2181"]
### the name of the consumer group
consumer_group = "telegraf_metrics_consumers"
### Maximum number of metrics to buffer between collection intervals
metric_buffer = 100000
### Offset (must be either "oldest" or "newest")
offset = "oldest"

### Data format to consume. This can be "json", "influx" or "graphite"
### Each data format has it's own unique set of configuration options, read
### more about them here:
### https://github.com/influxdata/telegraf/blob/master/DATA_FORMATS_INPUT.md
data_format = "influx"
`
|
2015-06-27 03:56:14 +00:00
|
|
|
|
|
|
|
func (k *Kafka) SampleConfig() string {
|
|
|
|
return sampleConfig
|
|
|
|
}
|
|
|
|
|
|
|
|
func (k *Kafka) Description() string {
|
2016-02-06 00:36:35 +00:00
|
|
|
return "Read metrics from Kafka topic(s)"
|
|
|
|
}
|
|
|
|
|
|
|
|
func (k *Kafka) SetParser(parser parsers.Parser) {
|
|
|
|
k.parser = parser
|
2015-06-27 03:56:14 +00:00
|
|
|
}
|
|
|
|
|
2015-11-16 20:12:45 +00:00
|
|
|
func (k *Kafka) Start() error {
|
|
|
|
k.Lock()
|
|
|
|
defer k.Unlock()
|
2015-06-27 03:56:14 +00:00
|
|
|
var consumerErr error
|
|
|
|
|
2015-11-16 20:12:45 +00:00
|
|
|
config := consumergroup.NewConfig()
|
|
|
|
switch strings.ToLower(k.Offset) {
|
|
|
|
case "oldest", "":
|
|
|
|
config.Offsets.Initial = sarama.OffsetOldest
|
|
|
|
case "newest":
|
|
|
|
config.Offsets.Initial = sarama.OffsetNewest
|
|
|
|
default:
|
|
|
|
log.Printf("WARNING: Kafka consumer invalid offset '%s', using 'oldest'\n",
|
|
|
|
k.Offset)
|
|
|
|
config.Offsets.Initial = sarama.OffsetOldest
|
|
|
|
}
|
|
|
|
|
|
|
|
if k.Consumer == nil || k.Consumer.Closed() {
|
2015-06-27 03:56:14 +00:00
|
|
|
k.Consumer, consumerErr = consumergroup.JoinConsumerGroup(
|
2015-11-16 20:12:45 +00:00
|
|
|
k.ConsumerGroup,
|
|
|
|
k.Topics,
|
2015-06-27 03:56:14 +00:00
|
|
|
k.ZookeeperPeers,
|
2015-11-16 20:12:45 +00:00
|
|
|
config,
|
2015-06-27 03:56:14 +00:00
|
|
|
)
|
|
|
|
if consumerErr != nil {
|
|
|
|
return consumerErr
|
|
|
|
}
|
|
|
|
|
2015-11-16 20:12:45 +00:00
|
|
|
// Setup message and error channels
|
|
|
|
k.in = k.Consumer.Messages()
|
|
|
|
k.errs = k.Consumer.Errors()
|
2015-06-27 03:56:14 +00:00
|
|
|
}
|
|
|
|
|
2015-11-16 20:12:45 +00:00
|
|
|
k.done = make(chan struct{})
|
2016-02-09 22:03:46 +00:00
|
|
|
if k.PointBuffer == 0 && k.MetricBuffer == 0 {
|
|
|
|
k.MetricBuffer = 100000
|
|
|
|
} else if k.PointBuffer > 0 {
|
|
|
|
// Legacy support of PointBuffer field TODO remove
|
|
|
|
k.MetricBuffer = k.PointBuffer
|
2015-11-16 20:12:45 +00:00
|
|
|
}
|
2016-02-09 22:03:46 +00:00
|
|
|
k.metricC = make(chan telegraf.Metric, k.MetricBuffer)
|
2015-06-27 03:56:14 +00:00
|
|
|
|
2015-11-16 20:12:45 +00:00
|
|
|
// Start the kafka message reader
|
2016-02-06 00:36:35 +00:00
|
|
|
go k.receiver()
|
2015-11-16 20:12:45 +00:00
|
|
|
log.Printf("Started the kafka consumer service, peers: %v, topics: %v\n",
|
|
|
|
k.ZookeeperPeers, k.Topics)
|
|
|
|
return nil
|
|
|
|
}
|
2015-06-27 03:56:14 +00:00
|
|
|
|
2016-02-06 00:36:35 +00:00
|
|
|
// receiver() reads all incoming messages from the consumer, and parses them into
|
2015-11-16 20:12:45 +00:00
|
|
|
// influxdb metric points.
|
2016-02-06 00:36:35 +00:00
|
|
|
func (k *Kafka) receiver() {
|
2015-06-27 03:56:14 +00:00
|
|
|
for {
|
|
|
|
select {
|
2015-11-16 20:12:45 +00:00
|
|
|
case <-k.done:
|
|
|
|
return
|
|
|
|
case err := <-k.errs:
|
|
|
|
log.Printf("Kafka Consumer Error: %s\n", err.Error())
|
|
|
|
case msg := <-k.in:
|
2016-02-06 00:36:35 +00:00
|
|
|
metrics, err := k.parser.Parse(msg.Value)
|
2015-11-16 20:12:45 +00:00
|
|
|
if err != nil {
|
2016-02-09 22:03:46 +00:00
|
|
|
log.Printf("KAFKA PARSE ERROR\nmessage: %s\nerror: %s",
|
2015-11-16 20:12:45 +00:00
|
|
|
string(msg.Value), err.Error())
|
2015-06-27 03:56:14 +00:00
|
|
|
}
|
|
|
|
|
2016-01-27 23:15:14 +00:00
|
|
|
for _, metric := range metrics {
|
2016-02-06 00:36:35 +00:00
|
|
|
fmt.Println(string(metric.Name()))
|
2015-11-16 20:12:45 +00:00
|
|
|
select {
|
2016-01-27 23:15:14 +00:00
|
|
|
case k.metricC <- metric:
|
2015-11-16 20:12:45 +00:00
|
|
|
continue
|
|
|
|
default:
|
2016-01-27 23:15:14 +00:00
|
|
|
log.Printf("Kafka Consumer buffer is full, dropping a metric." +
|
2016-02-09 22:03:46 +00:00
|
|
|
" You may want to increase the metric_buffer setting")
|
2015-11-16 20:12:45 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if !k.doNotCommitMsgs {
|
|
|
|
// TODO(cam) this locking can be removed if this PR gets merged:
|
|
|
|
// https://github.com/wvanbergen/kafka/pull/84
|
|
|
|
k.Lock()
|
|
|
|
k.Consumer.CommitUpto(msg)
|
|
|
|
k.Unlock()
|
2015-06-27 03:56:14 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2015-11-16 20:12:45 +00:00
|
|
|
func (k *Kafka) Stop() {
|
|
|
|
k.Lock()
|
|
|
|
defer k.Unlock()
|
|
|
|
close(k.done)
|
|
|
|
if err := k.Consumer.Close(); err != nil {
|
|
|
|
log.Printf("Error closing kafka consumer: %s\n", err.Error())
|
|
|
|
}
|
|
|
|
}
|
2015-06-27 03:56:14 +00:00
|
|
|
|
2016-01-27 21:21:36 +00:00
|
|
|
func (k *Kafka) Gather(acc telegraf.Accumulator) error {
|
2015-11-16 20:12:45 +00:00
|
|
|
k.Lock()
|
|
|
|
defer k.Unlock()
|
2016-02-09 22:03:46 +00:00
|
|
|
nmetrics := len(k.metricC)
|
|
|
|
for i := 0; i < nmetrics; i++ {
|
|
|
|
metric := <-k.metricC
|
|
|
|
acc.AddFields(metric.Name(), metric.Fields(), metric.Tags(), metric.Time())
|
2015-06-27 03:56:14 +00:00
|
|
|
}
|
2015-11-16 20:12:45 +00:00
|
|
|
return nil
|
2015-06-27 03:56:14 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
func init() {
|
2016-01-27 21:21:36 +00:00
|
|
|
inputs.Add("kafka_consumer", func() telegraf.Input {
|
2015-06-27 03:56:14 +00:00
|
|
|
return &Kafka{}
|
|
|
|
})
|
|
|
|
}
|