telegraf/internal/models/running_output.go

package models

import (
	"log"
	"sync"
	"time"

	"github.com/influxdata/telegraf"
	"github.com/influxdata/telegraf/internal/buffer"
	"github.com/influxdata/telegraf/metric"
	"github.com/influxdata/telegraf/selfstat"
)

const (
	// DEFAULT_METRIC_BATCH_SIZE is the batch size NewRunningOutput falls back
	// to when it is called with a batchSize of 0.
	DEFAULT_METRIC_BATCH_SIZE = 1000

	// DEFAULT_METRIC_BUFFER_LIMIT is the buffer limit NewRunningOutput falls
	// back to when it is called with a bufferLimit of 0. It should be a
	// multiple of the batch size.
	DEFAULT_METRIC_BUFFER_LIMIT = 10000
)

// RunningOutput wraps a telegraf.Output together with its configuration, the
// buffers of metrics waiting to be written, and the selfstat counters that
// report on its activity.
type RunningOutput struct {
	// Name identifies the output in log messages and is used as the "output"
	// tag on the selfstat stats below.
	Name              string
	// Output is the plugin that batches of metrics are written to.
	Output            telegraf.Output
	// Config carries the filter applied to each metric in AddMetric.
	Config            *OutputConfig
	// MetricBufferLimit is the size given to the failed-metrics buffer.
	MetricBufferLimit int
	// MetricBatchSize is the size given to the pending-metrics buffer and the
	// number of metrics requested per batch when writing.
	MetricBatchSize   int

	// MetricsFiltered counts metrics rejected by the filter in AddMetric.
	MetricsFiltered selfstat.Stat
	// MetricsWritten counts metrics handed to the output without error.
	MetricsWritten  selfstat.Stat
	// BufferSize is set at the start of each Write to the number of pending
	// plus previously failed metrics.
	BufferSize      selfstat.Stat
	// BufferLimit reports MetricBufferLimit.
	BufferLimit     selfstat.Stat
	// WriteTime records the duration, in nanoseconds, of successful writes.
	WriteTime       selfstat.Stat

	// metrics holds newly added metrics that have not had a write attempt.
	metrics     *buffer.Buffer
	// failMetrics holds batches whose write attempt returned an error.
	failMetrics *buffer.Buffer

	// Guards against concurrent calls to the Output as described in #3009
	sync.Mutex
}

// NewRunningOutput builds a RunningOutput around the given output plugin.
//
// name is used in log messages and as the "output" tag of the selfstat stats
// registered here. conf supplies the metric filter. A batchSize of 0 selects
// DEFAULT_METRIC_BATCH_SIZE and a bufferLimit of 0 selects
// DEFAULT_METRIC_BUFFER_LIMIT.
func NewRunningOutput(
	name string,
	output telegraf.Output,
	conf *OutputConfig,
	batchSize int,
	bufferLimit int,
) *RunningOutput {
	if bufferLimit == 0 {
		bufferLimit = DEFAULT_METRIC_BUFFER_LIMIT
	}
	if batchSize == 0 {
		batchSize = DEFAULT_METRIC_BATCH_SIZE
	}
	ro := &RunningOutput{
		Name:              name,
		metrics:           buffer.NewBuffer(batchSize),
		failMetrics:       buffer.NewBuffer(bufferLimit),
		Output:            output,
		Config:            conf,
		MetricBufferLimit: bufferLimit,
		MetricBatchSize:   batchSize,
		MetricsWritten: selfstat.Register(
			"write",
			"metrics_written",
			map[string]string{"output": name},
		),
		MetricsFiltered: selfstat.Register(
			"write",
			"metrics_filtered",
			map[string]string{"output": name},
		),
		BufferSize: selfstat.Register(
			"write",
			"buffer_size",
			map[string]string{"output": name},
		),
		BufferLimit: selfstat.Register(
			"write",
			"buffer_limit",
			map[string]string{"output": name},
		),
		WriteTime: selfstat.RegisterTiming(
			"write",
			"write_time_ns",
			map[string]string{"output": name},
		),
	}
	// The limit is a gauge, not a counter: assign it rather than increment
	// it. selfstat hands back the already-registered stat when the same
	// measurement, field and tags are registered again, so an increment would
	// add the limit on top of the previous value every time an output with
	// this name is constructed.
	ro.BufferLimit.Set(int64(ro.MetricBufferLimit))
	return ro
}

// AddMetric queues a metric for this output. Nil metrics are dropped. When
// the output's filter is active the metric is run through it first: rejected
// metrics are counted in MetricsFiltered and discarded, accepted ones are
// rebuilt from the filtered name, tags and fields. Once the pending buffer
// holds exactly MetricBatchSize metrics the batch is written immediately, and
// a batch that fails to write is moved to the failed-metrics buffer.
func (ro *RunningOutput) AddMetric(m telegraf.Metric) {
	if m == nil {
		return
	}

	// Apply any tagexclude/taginclude style filtering before buffering.
	if ro.Config.Filter.IsActive() {
		// Metrics are immutable once created, so dropping tags means
		// assembling a replacement metric from the filtered parts.
		metricName := m.Name()
		metricTags := m.Tags()
		metricFields := m.Fields()
		timestamp := m.Time()
		if !ro.Config.Filter.Apply(metricName, metricFields, metricTags) {
			ro.MetricsFiltered.Incr(1)
			return
		}
		// Building from an existing metric cannot fail, so the error is
		// deliberately discarded.
		m, _ = metric.New(metricName, metricTags, metricFields, timestamp)
	}

	ro.metrics.Add(m)
	if ro.metrics.Len() != ro.MetricBatchSize {
		return
	}

	// A full batch has accumulated: flush it now.
	full := ro.metrics.Batch(ro.MetricBatchSize)
	if err := ro.write(full); err != nil {
		ro.failMetrics.Add(full...)
	}
}

// Write flushes the buffered metrics to the output: first the metrics left
// over from earlier failed writes, then one batch of pending metrics. It
// returns the first error reported by the output, or nil. After an error no
// further write is attempted in this call; the remaining batches are put back
// into the failed-metrics buffer.
func (ro *RunningOutput) Write() error {
	failed := ro.failMetrics.Len()
	pending := ro.metrics.Len()
	total := failed + pending
	ro.BufferSize.Set(int64(total))
	log.Printf("D! Output [%s] buffer fullness: %d / %d metrics. ",
		ro.Name, total, ro.MetricBufferLimit)

	var writeErr error
	if !ro.failMetrics.IsEmpty() {
		// The failed metrics are replayed as fullBatches batches of
		// MetricBatchSize followed by one final batch holding the remainder.
		fullBatches := failed / ro.MetricBatchSize
		remainder := failed % ro.MetricBatchSize

		for i := 0; i <= fullBatches; i++ {
			size := ro.MetricBatchSize
			if i == fullBatches {
				// Final pass: take only the metrics that have not been
				// pulled yet in this call, which keeps ordering intact.
				size = remainder
			}
			retry := ro.failMetrics.Batch(size)
			// Once a write has failed, skip the output for the rest of the
			// call but keep looping so every batch is rotated back into the
			// buffer in its original order.
			if writeErr == nil {
				writeErr = ro.write(retry)
			}
			if writeErr != nil {
				ro.failMetrics.Add(retry...)
			}
		}
	}

	fresh := ro.metrics.Batch(ro.MetricBatchSize)
	// As above, do not touch an output that already failed. When there were
	// no failed metrics, writeErr is necessarily nil here.
	if writeErr == nil {
		writeErr = ro.write(fresh)
	}
	if writeErr != nil {
		ro.failMetrics.Add(fresh...)
	}
	return writeErr
}

// write sends one batch to the output while holding the RunningOutput's
// mutex, so the output's Write is never entered concurrently through this
// type. An empty batch is a no-op that returns nil. On success the batch is
// logged and MetricsWritten and WriteTime are updated; on failure the
// output's error is returned and no stats change.
func (ro *RunningOutput) write(metrics []telegraf.Metric) error {
	count := len(metrics)
	if count == 0 {
		return nil
	}

	ro.Lock()
	defer ro.Unlock()

	began := time.Now()
	if err := ro.Output.Write(metrics); err != nil {
		return err
	}
	took := time.Since(began)

	log.Printf("D! Output [%s] wrote batch of %d metrics in %s\n",
		ro.Name, count, took)
	ro.MetricsWritten.Incr(int64(count))
	ro.WriteTime.Incr(took.Nanoseconds())
	return nil
}

// OutputConfig holds the per-output settings: the output's name and the
// Filter that AddMetric applies to each metric before buffering it.
type OutputConfig struct {
	Name   string
	Filter Filter
}
Rename internal_models package to models 2016-07-28 11:31:11 +00:00			`package models`
Implement a per-output fixed size metric buffer Also moved some objects out of config.go and put them in their own package, internal/models fixes #568 closes #285 2016-01-22 18:54:12 +00:00
			`import (`
			`"log"`
Prevent Write from being called concurrently (#3011) 2017-07-12 19:03:23 +00:00			`"sync"`
Implement a per-output fixed size metric buffer Also moved some objects out of config.go and put them in their own package, internal/models fixes #568 closes #285 2016-01-22 18:54:12 +00:00			`"time"`

Create public models for telegraf metrics, accumlator, plugins This will basically make the root directory a place for storing the major telegraf interfaces, which will make telegraf's godoc looks quite a bit nicer. And make it easier for contributors to lookup the few data types that they actually care about. closes #564 2016-01-27 21:21:36 +00:00			`"github.com/influxdata/telegraf"`
Performance refactor of running_output buffers closes #914 closes #967 2016-04-25 23:49:06 +00:00			`"github.com/influxdata/telegraf/internal/buffer"`
Implement telegraf's own full metric type main reasons behind this: - make adding/removing tags cheap - make adding/removing fields cheap - make parsing cheaper - make parse -> decorate -> write out bytes metric flow much faster Refactor serializer to use byte buffer 2016-11-22 12:51:57 +00:00			`"github.com/influxdata/telegraf/metric"`
Implement telegraf collecting stats on itself closes #1348 2016-11-07 08:34:46 +00:00			`"github.com/influxdata/telegraf/selfstat"`
Implement a per-output fixed size metric buffer Also moved some objects out of config.go and put them in their own package, internal/models fixes #568 closes #285 2016-01-22 18:54:12 +00:00			`)`

Flush based on buffer size rather than time this includes: - Add Accumulator to the Start() function of service inputs - For message consumer plugins, use the Accumulator to constantly add metrics and make Gather a dummy function - rework unit tests to match this new behavior. - make "flush_buffer_when_full" a config option that defaults to true closes #666 2016-02-16 00:21:38 +00:00			`const (`
Refactor running_output buffering closes #1087 2016-04-24 10:43:54 +00:00			`// Default size of metrics batch size.`
			`DEFAULT_METRIC_BATCH_SIZE = 1000`

			`// Default number of metrics kept. It should be a multiple of batch size.`
			`DEFAULT_METRIC_BUFFER_LIMIT = 10000`
Flush based on buffer size rather than time this includes: - Add Accumulator to the Start() function of service inputs - For message consumer plugins, use the Accumulator to constantly add metrics and make Gather a dummy function - rework unit tests to match this new behavior. - make "flush_buffer_when_full" a config option that defaults to true closes #666 2016-02-16 00:21:38 +00:00			`)`
Implement a per-output fixed size metric buffer Also moved some objects out of config.go and put them in their own package, internal/models fixes #568 closes #285 2016-01-22 18:54:12 +00:00
Performance refactor of running_output buffers closes #914 closes #967 2016-04-25 23:49:06 +00:00			`// RunningOutput contains the output configuration`
Implement a per-output fixed size metric buffer Also moved some objects out of config.go and put them in their own package, internal/models fixes #568 closes #285 2016-01-22 18:54:12 +00:00			`type RunningOutput struct {`
Performance refactor of running_output buffers closes #914 closes #967 2016-04-25 23:49:06 +00:00			`Name string`
			`Output telegraf.Output`
			`Config *OutputConfig`
			`MetricBufferLimit int`
			`MetricBatchSize int`

Implement telegraf collecting stats on itself closes #1348 2016-11-07 08:34:46 +00:00			`MetricsFiltered selfstat.Stat`
			`MetricsWritten selfstat.Stat`
			`BufferSize selfstat.Stat`
			`BufferLimit selfstat.Stat`
			`WriteTime selfstat.Stat`

Performance refactor of running_output buffers closes #914 closes #967 2016-04-25 23:49:06 +00:00			`metrics *buffer.Buffer`
			`failMetrics *buffer.Buffer`
Prevent Write from being called concurrently (#3011) 2017-07-12 19:03:23 +00:00
			`// Guards against concurrent calls to the Output as described in #3009`
			`sync.Mutex`
Implement a per-output fixed size metric buffer Also moved some objects out of config.go and put them in their own package, internal/models fixes #568 closes #285 2016-01-22 18:54:12 +00:00			`}`

			`func NewRunningOutput(`
			`name string,`
Create public models for telegraf metrics, accumlator, plugins This will basically make the root directory a place for storing the major telegraf interfaces, which will make telegraf's godoc looks quite a bit nicer. And make it easier for contributors to lookup the few data types that they actually care about. closes #564 2016-01-27 21:21:36 +00:00			`output telegraf.Output,`
Implement a per-output fixed size metric buffer Also moved some objects out of config.go and put them in their own package, internal/models fixes #568 closes #285 2016-01-22 18:54:12 +00:00			`conf *OutputConfig,`
Performance refactor of running_output buffers closes #914 closes #967 2016-04-25 23:49:06 +00:00			`batchSize int,`
			`bufferLimit int,`
Implement a per-output fixed size metric buffer Also moved some objects out of config.go and put them in their own package, internal/models fixes #568 closes #285 2016-01-22 18:54:12 +00:00			`) *RunningOutput {`
Performance refactor of running_output buffers closes #914 closes #967 2016-04-25 23:49:06 +00:00			`if bufferLimit == 0 {`
			`bufferLimit = DEFAULT_METRIC_BUFFER_LIMIT`
			`}`
			`if batchSize == 0 {`
			`batchSize = DEFAULT_METRIC_BATCH_SIZE`
			`}`
Implement a per-output fixed size metric buffer Also moved some objects out of config.go and put them in their own package, internal/models fixes #568 closes #285 2016-01-22 18:54:12 +00:00			`ro := &RunningOutput{`
Flush based on buffer size rather than time this includes: - Add Accumulator to the Start() function of service inputs - For message consumer plugins, use the Accumulator to constantly add metrics and make Gather a dummy function - rework unit tests to match this new behavior. - make "flush_buffer_when_full" a config option that defaults to true closes #666 2016-02-16 00:21:38 +00:00			`Name: name,`
Performance refactor of running_output buffers closes #914 closes #967 2016-04-25 23:49:06 +00:00			`metrics: buffer.NewBuffer(batchSize),`
			`failMetrics: buffer.NewBuffer(bufferLimit),`
Flush based on buffer size rather than time this includes: - Add Accumulator to the Start() function of service inputs - For message consumer plugins, use the Accumulator to constantly add metrics and make Gather a dummy function - rework unit tests to match this new behavior. - make "flush_buffer_when_full" a config option that defaults to true closes #666 2016-02-16 00:21:38 +00:00			`Output: output,`
			`Config: conf,`
Performance refactor of running_output buffers closes #914 closes #967 2016-04-25 23:49:06 +00:00			`MetricBufferLimit: bufferLimit,`
			`MetricBatchSize: batchSize,`
Implement telegraf collecting stats on itself closes #1348 2016-11-07 08:34:46 +00:00			`MetricsWritten: selfstat.Register(`
			`"write",`
			`"metrics_written",`
			`map[string]string{"output": name},`
			`),`
			`MetricsFiltered: selfstat.Register(`
			`"write",`
			`"metrics_filtered",`
			`map[string]string{"output": name},`
			`),`
			`BufferSize: selfstat.Register(`
			`"write",`
			`"buffer_size",`
			`map[string]string{"output": name},`
			`),`
			`BufferLimit: selfstat.Register(`
			`"write",`
			`"buffer_limit",`
			`map[string]string{"output": name},`
			`),`
			`WriteTime: selfstat.RegisterTiming(`
			`"write",`
			`"write_time_ns",`
			`map[string]string{"output": name},`
			`),`
Implement a per-output fixed size metric buffer Also moved some objects out of config.go and put them in their own package, internal/models fixes #568 closes #285 2016-01-22 18:54:12 +00:00			`}`
Implement telegraf collecting stats on itself closes #1348 2016-11-07 08:34:46 +00:00			`ro.BufferLimit.Incr(int64(ro.MetricBufferLimit))`
Implement a per-output fixed size metric buffer Also moved some objects out of config.go and put them in their own package, internal/models fixes #568 closes #285 2016-01-22 18:54:12 +00:00			`return ro`
			`}`

Flush based on buffer size rather than time this includes: - Add Accumulator to the Start() function of service inputs - For message consumer plugins, use the Accumulator to constantly add metrics and make Gather a dummy function - rework unit tests to match this new behavior. - make "flush_buffer_when_full" a config option that defaults to true closes #666 2016-02-16 00:21:38 +00:00			`// AddMetric adds a metric to the output. This function can also write cached`
			`// points if FlushBufferWhenFull is true.`
Implement telegraf's own full metric type main reasons behind this: - make adding/removing tags cheap - make adding/removing fields cheap - make parsing cheaper - make parse -> decorate -> write out bytes metric flow much faster Refactor serializer to use byte buffer 2016-11-22 12:51:57 +00:00			`func (ro *RunningOutput) AddMetric(m telegraf.Metric) {`
running output: Drop nil metrics fixes #2317 2017-02-01 08:55:22 +00:00			`if m == nil {`
			`return`
			`}`
Adds support for removing/keeping tags from metrics closes #706 2016-04-12 23:06:27 +00:00			`// Filter any tagexclude/taginclude parameters before adding metric`
Refactor and code cleanup of filtering started working on this with the idea of fixing #1623, although I realized that this was actually just a documentation issue around a toml eccentricity. closes #1623 2016-09-05 15:16:37 +00:00			`if ro.Config.Filter.IsActive() {`
Adds support for removing/keeping tags from metrics closes #706 2016-04-12 23:06:27 +00:00			`// In order to filter out tags, we need to create a new metric, since`
			`// metrics are immutable once created.`
Implement telegraf's own full metric type main reasons behind this: - make adding/removing tags cheap - make adding/removing fields cheap - make parsing cheaper - make parse -> decorate -> write out bytes metric flow much faster Refactor serializer to use byte buffer 2016-11-22 12:51:57 +00:00			`name := m.Name()`
			`tags := m.Tags()`
			`fields := m.Fields()`
			`t := m.Time()`
Refactor and code cleanup of filtering started working on this with the idea of fixing #1623, although I realized that this was actually just a documentation issue around a toml eccentricity. closes #1623 2016-09-05 15:16:37 +00:00			`if ok := ro.Config.Filter.Apply(name, fields, tags); !ok {`
Implement telegraf collecting stats on itself closes #1348 2016-11-07 08:34:46 +00:00			`ro.MetricsFiltered.Incr(1)`
Refactor and code cleanup of filtering started working on this with the idea of fixing #1623, although I realized that this was actually just a documentation issue around a toml eccentricity. closes #1623 2016-09-05 15:16:37 +00:00			`return`
			`}`
Adds support for removing/keeping tags from metrics closes #706 2016-04-12 23:06:27 +00:00			`// error is not possible if creating from another metric, so ignore.`
Implement telegraf's own full metric type main reasons behind this: - make adding/removing tags cheap - make adding/removing fields cheap - make parsing cheaper - make parse -> decorate -> write out bytes metric flow much faster Refactor serializer to use byte buffer 2016-11-22 12:51:57 +00:00			`m, _ = metric.New(name, tags, fields, t)`
Adds support for removing/keeping tags from metrics closes #706 2016-04-12 23:06:27 +00:00			`}`

Implement telegraf's own full metric type main reasons behind this: - make adding/removing tags cheap - make adding/removing fields cheap - make parsing cheaper - make parse -> decorate -> write out bytes metric flow much faster Refactor serializer to use byte buffer 2016-11-22 12:51:57 +00:00			`ro.metrics.Add(m)`
Performance refactor of running_output buffers closes #914 closes #967 2016-04-25 23:49:06 +00:00			`if ro.metrics.Len() == ro.MetricBatchSize {`
			`batch := ro.metrics.Batch(ro.MetricBatchSize)`
			`err := ro.write(batch)`
			`if err != nil {`
			`ro.failMetrics.Add(batch...)`
Implement a per-output fixed size metric buffer Also moved some objects out of config.go and put them in their own package, internal/models fixes #568 closes #285 2016-01-22 18:54:12 +00:00			`}`
			`}`
			`}`

Flush based on buffer size rather than time this includes: - Add Accumulator to the Start() function of service inputs - For message consumer plugins, use the Accumulator to constantly add metrics and make Gather a dummy function - rework unit tests to match this new behavior. - make "flush_buffer_when_full" a config option that defaults to true closes #666 2016-02-16 00:21:38 +00:00			`// Write writes all cached points to this output.`
Implement a per-output fixed size metric buffer Also moved some objects out of config.go and put them in their own package, internal/models fixes #568 closes #285 2016-01-22 18:54:12 +00:00			`func (ro *RunningOutput) Write() error {`
Implement telegraf collecting stats on itself closes #1348 2016-11-07 08:34:46 +00:00			`nFails, nMetrics := ro.failMetrics.Len(), ro.metrics.Len()`
Only set the buffer size once fixes #2380 2017-02-16 19:37:55 +00:00			`ro.BufferSize.Set(int64(nFails + nMetrics))`
Implement telegraf collecting stats on itself closes #1348 2016-11-07 08:34:46 +00:00			`log.Printf("D! Output [%s] buffer fullness: %d / %d metrics. ",`
			`ro.Name, nFails+nMetrics, ro.MetricBufferLimit)`
Performance refactor of running_output buffers closes #914 closes #967 2016-04-25 23:49:06 +00:00			`var err error`
			`if !ro.failMetrics.IsEmpty() {`
			`// how many batches of failed writes we need to write.`
Implement telegraf collecting stats on itself closes #1348 2016-11-07 08:34:46 +00:00			`nBatches := nFails/ro.MetricBatchSize + 1`
Performance refactor of running_output buffers closes #914 closes #967 2016-04-25 23:49:06 +00:00			`batchSize := ro.MetricBatchSize`

			`for i := 0; i < nBatches; i++ {`
			`// If it's the last batch, only grab the metrics that have not had`
			`// a write attempt already (this is primarily to preserve order).`
			`if i == nBatches-1 {`
Implement telegraf collecting stats on itself closes #1348 2016-11-07 08:34:46 +00:00			`batchSize = nFails % ro.MetricBatchSize`
Performance refactor of running_output buffers closes #914 closes #967 2016-04-25 23:49:06 +00:00			`}`
			`batch := ro.failMetrics.Batch(batchSize)`
			`// If we've already failed previous writes, don't bother trying to`
			`// write to this output again. We are not exiting the loop just so`
			`// that we can rotate the metrics to preserve order.`
			`if err == nil {`
			`err = ro.write(batch)`
			`}`
			`if err != nil {`
			`ro.failMetrics.Add(batch...)`
			`}`
Refactor running_output buffering closes #1087 2016-04-24 10:43:54 +00:00			`}`
			`}`

Performance refactor of running_output buffers closes #914 closes #967 2016-04-25 23:49:06 +00:00			`batch := ro.metrics.Batch(ro.MetricBatchSize)`
			`// see comment above about not trying to write to an already failed output.`
			`// if ro.failMetrics is empty then err will always be nil at this point.`
			`if err == nil {`
			`err = ro.write(batch)`
			`}`
Implement telegraf collecting stats on itself closes #1348 2016-11-07 08:34:46 +00:00
Flush based on buffer size rather than time this includes: - Add Accumulator to the Start() function of service inputs - For message consumer plugins, use the Accumulator to constantly add metrics and make Gather a dummy function - rework unit tests to match this new behavior. - make "flush_buffer_when_full" a config option that defaults to true closes #666 2016-02-16 00:21:38 +00:00			`if err != nil {`
Performance refactor of running_output buffers closes #914 closes #967 2016-04-25 23:49:06 +00:00			`ro.failMetrics.Add(batch...)`
Flush based on buffer size rather than time this includes: - Add Accumulator to the Start() function of service inputs - For message consumer plugins, use the Accumulator to constantly add metrics and make Gather a dummy function - rework unit tests to match this new behavior. - make "flush_buffer_when_full" a config option that defaults to true closes #666 2016-02-16 00:21:38 +00:00			`return err`
			`}`
			`return nil`
			`}`

			`func (ro *RunningOutput) write(metrics []telegraf.Metric) error {`
Implement telegraf collecting stats on itself closes #1348 2016-11-07 08:34:46 +00:00			`nMetrics := len(metrics)`
			`if nMetrics == 0 {`
Do not write metrics if there are 0 to write closes #884 2016-03-18 16:51:14 +00:00			`return nil`
			`}`
Prevent Write from being called concurrently (#3011) 2017-07-12 19:03:23 +00:00			`ro.Lock()`
			`defer ro.Unlock()`
Implement a per-output fixed size metric buffer Also moved some objects out of config.go and put them in their own package, internal/models fixes #568 closes #285 2016-01-22 18:54:12 +00:00			`start := time.Now()`
Flush based on buffer size rather than time this includes: - Add Accumulator to the Start() function of service inputs - For message consumer plugins, use the Accumulator to constantly add metrics and make Gather a dummy function - rework unit tests to match this new behavior. - make "flush_buffer_when_full" a config option that defaults to true closes #666 2016-02-16 00:21:38 +00:00			`err := ro.Output.Write(metrics)`
Implement a per-output fixed size metric buffer Also moved some objects out of config.go and put them in their own package, internal/models fixes #568 closes #285 2016-01-22 18:54:12 +00:00			`elapsed := time.Since(start)`
			`if err == nil {`
Implement telegraf collecting stats on itself closes #1348 2016-11-07 08:34:46 +00:00			`log.Printf("D! Output [%s] wrote batch of %d metrics in %s\n",`
			`ro.Name, nMetrics, elapsed)`
			`ro.MetricsWritten.Incr(int64(nMetrics))`
			`ro.WriteTime.Incr(elapsed.Nanoseconds())`
Implement a per-output fixed size metric buffer Also moved some objects out of config.go and put them in their own package, internal/models fixes #568 closes #285 2016-01-22 18:54:12 +00:00			`}`
			`return err`
			`}`

			`// OutputConfig containing name and filter`
			`type OutputConfig struct {`
			`Name string`
			`Filter Filter`
			`}`