205 lines
8.0 KiB
Go
205 lines
8.0 KiB
Go
package riak
|
|
|
|
import (
	"encoding/json"
	"fmt"
	"net/http"
	"net/url"
	"strings"
	"time"

	"github.com/influxdata/telegraf"
	"github.com/influxdata/telegraf/plugins/inputs"
)
|
|
|
|
// Riak is an input plugin that gathers statistics from one or more Riak
// instances over HTTP.
type Riak struct {
	// Servers lists the HTTP base addresses of the Riak nodes to query,
	// e.g. "http://127.0.0.1:8098".
	Servers []string

	// client is the HTTP client used for every stats request.
	client *http.Client
}
|
|
|
|
// NewRiak return a new instance of Riak with a default http client
|
|
func NewRiak() *Riak {
|
|
tr := &http.Transport{ResponseHeaderTimeout: time.Duration(3 * time.Second)}
|
|
client := &http.Client{
|
|
Transport: tr,
|
|
Timeout: time.Duration(4 * time.Second),
|
|
}
|
|
return &Riak{client: client}
|
|
}
|
|
|
|
// riakStats is the decoding target for the JSON document received from Riak.
// Only the keys named in the struct tags are decoded; fields are grouped by
// stat family.
type riakStats struct {
	// Name reported by the node itself.
	Nodename string `json:"nodename"`

	// cpu_avg* stats.
	CpuAvg1  int64 `json:"cpu_avg1"`
	CpuAvg5  int64 `json:"cpu_avg5"`
	CpuAvg15 int64 `json:"cpu_avg15"`

	// memory_* stats.
	MemoryCode      int64 `json:"memory_code"`
	MemoryEts       int64 `json:"memory_ets"`
	MemoryProcesses int64 `json:"memory_processes"`
	MemorySystem    int64 `json:"memory_system"`
	MemoryTotal     int64 `json:"memory_total"`

	// node_get_fsm_objsize_* stats.
	NodeGetFsmObjsize100    int64 `json:"node_get_fsm_objsize_100"`
	NodeGetFsmObjsize95     int64 `json:"node_get_fsm_objsize_95"`
	NodeGetFsmObjsize99     int64 `json:"node_get_fsm_objsize_99"`
	NodeGetFsmObjsizeMean   int64 `json:"node_get_fsm_objsize_mean"`
	NodeGetFsmObjsizeMedian int64 `json:"node_get_fsm_objsize_median"`

	// node_get_fsm_siblings_* stats.
	NodeGetFsmSiblings100    int64 `json:"node_get_fsm_siblings_100"`
	NodeGetFsmSiblings95     int64 `json:"node_get_fsm_siblings_95"`
	NodeGetFsmSiblings99     int64 `json:"node_get_fsm_siblings_99"`
	NodeGetFsmSiblingsMean   int64 `json:"node_get_fsm_siblings_mean"`
	NodeGetFsmSiblingsMedian int64 `json:"node_get_fsm_siblings_median"`

	// node_get_fsm_time_* stats.
	NodeGetFsmTime100    int64 `json:"node_get_fsm_time_100"`
	NodeGetFsmTime95     int64 `json:"node_get_fsm_time_95"`
	NodeGetFsmTime99     int64 `json:"node_get_fsm_time_99"`
	NodeGetFsmTimeMean   int64 `json:"node_get_fsm_time_mean"`
	NodeGetFsmTimeMedian int64 `json:"node_get_fsm_time_median"`

	// node_put_fsm_time_* stats.
	NodePutFsmTime100    int64 `json:"node_put_fsm_time_100"`
	NodePutFsmTime95     int64 `json:"node_put_fsm_time_95"`
	NodePutFsmTime99     int64 `json:"node_put_fsm_time_99"`
	NodePutFsmTimeMean   int64 `json:"node_put_fsm_time_mean"`
	NodePutFsmTimeMedian int64 `json:"node_put_fsm_time_median"`

	// node_gets* / node_puts* stats.
	NodeGets      int64 `json:"node_gets"`
	NodeGetsTotal int64 `json:"node_gets_total"`
	NodePuts      int64 `json:"node_puts"`
	NodePutsTotal int64 `json:"node_puts_total"`

	// pbc_* stats.
	PbcActive        int64 `json:"pbc_active"`
	PbcConnects      int64 `json:"pbc_connects"`
	PbcConnectsTotal int64 `json:"pbc_connects_total"`

	// vnode_* stats.
	VnodeGets             int64 `json:"vnode_gets"`
	VnodeGetsTotal        int64 `json:"vnode_gets_total"`
	VnodeIndexReads       int64 `json:"vnode_index_reads"`
	VnodeIndexReadsTotal  int64 `json:"vnode_index_reads_total"`
	VnodeIndexWrites      int64 `json:"vnode_index_writes"`
	VnodeIndexWritesTotal int64 `json:"vnode_index_writes_total"`
	VnodePuts             int64 `json:"vnode_puts"`
	VnodePutsTotal        int64 `json:"vnode_puts_total"`

	// read_repairs* stats.
	ReadRepairs      int64 `json:"read_repairs"`
	ReadRepairsTotal int64 `json:"read_repairs_total"`
}
|
|
|
|
// sampleConfig is the sample configuration returned by SampleConfig. It
// points the plugin at a single Riak node on localhost, port 8098.
const sampleConfig = `
# Specify a list of one or more riak http servers
servers = ["http://localhost:8098"]
`
|
|
|
|
// Returns a sample configuration for the plugin
|
|
func (r *Riak) SampleConfig() string {
|
|
return sampleConfig
|
|
}
|
|
|
|
// Returns a description of the plugin
|
|
func (r *Riak) Description() string {
|
|
return "Read metrics one or many Riak servers"
|
|
}
|
|
|
|
// Reads stats from all configured servers.
|
|
func (r *Riak) Gather(acc telegraf.Accumulator) error {
|
|
// Default to a single server at localhost (default port) if none specified
|
|
if len(r.Servers) == 0 {
|
|
r.Servers = []string{"http://127.0.0.1:8098"}
|
|
}
|
|
|
|
// Range over all servers, gathering stats. Returns early in case of any error.
|
|
for _, s := range r.Servers {
|
|
acc.AddError(r.gatherServer(s, acc))
|
|
}
|
|
|
|
return nil
|
|
}
|
|
|
|
// Gathers stats from a single server, adding them to the accumulator
|
|
func (r *Riak) gatherServer(s string, acc telegraf.Accumulator) error {
|
|
// Parse the given URL to extract the server tag
|
|
u, err := url.Parse(s)
|
|
if err != nil {
|
|
return fmt.Errorf("riak unable to parse given server url %s: %s", s, err)
|
|
}
|
|
|
|
// Perform the GET request to the riak /stats endpoint
|
|
resp, err := r.client.Get(s + "/stats")
|
|
if err != nil {
|
|
return err
|
|
}
|
|
defer resp.Body.Close()
|
|
|
|
// Successful responses will always return status code 200
|
|
if resp.StatusCode != http.StatusOK {
|
|
return fmt.Errorf("riak responded with unexpected status code %d", resp.StatusCode)
|
|
}
|
|
|
|
// Decode the response JSON into a new stats struct
|
|
stats := &riakStats{}
|
|
if err := json.NewDecoder(resp.Body).Decode(stats); err != nil {
|
|
return fmt.Errorf("unable to decode riak response: %s", err)
|
|
}
|
|
|
|
// Build a map of tags
|
|
tags := map[string]string{
|
|
"nodename": stats.Nodename,
|
|
"server": u.Host,
|
|
}
|
|
|
|
// Build a map of field values
|
|
fields := map[string]interface{}{
|
|
"cpu_avg1": stats.CpuAvg1,
|
|
"cpu_avg15": stats.CpuAvg15,
|
|
"cpu_avg5": stats.CpuAvg5,
|
|
"memory_code": stats.MemoryCode,
|
|
"memory_ets": stats.MemoryEts,
|
|
"memory_processes": stats.MemoryProcesses,
|
|
"memory_system": stats.MemorySystem,
|
|
"memory_total": stats.MemoryTotal,
|
|
"node_get_fsm_objsize_100": stats.NodeGetFsmObjsize100,
|
|
"node_get_fsm_objsize_95": stats.NodeGetFsmObjsize95,
|
|
"node_get_fsm_objsize_99": stats.NodeGetFsmObjsize99,
|
|
"node_get_fsm_objsize_mean": stats.NodeGetFsmObjsizeMean,
|
|
"node_get_fsm_objsize_median": stats.NodeGetFsmObjsizeMedian,
|
|
"node_get_fsm_siblings_100": stats.NodeGetFsmSiblings100,
|
|
"node_get_fsm_siblings_95": stats.NodeGetFsmSiblings95,
|
|
"node_get_fsm_siblings_99": stats.NodeGetFsmSiblings99,
|
|
"node_get_fsm_siblings_mean": stats.NodeGetFsmSiblingsMean,
|
|
"node_get_fsm_siblings_median": stats.NodeGetFsmSiblingsMedian,
|
|
"node_get_fsm_time_100": stats.NodeGetFsmTime100,
|
|
"node_get_fsm_time_95": stats.NodeGetFsmTime95,
|
|
"node_get_fsm_time_99": stats.NodeGetFsmTime99,
|
|
"node_get_fsm_time_mean": stats.NodeGetFsmTimeMean,
|
|
"node_get_fsm_time_median": stats.NodeGetFsmTimeMedian,
|
|
"node_gets": stats.NodeGets,
|
|
"node_gets_total": stats.NodeGetsTotal,
|
|
"node_put_fsm_time_100": stats.NodePutFsmTime100,
|
|
"node_put_fsm_time_95": stats.NodePutFsmTime95,
|
|
"node_put_fsm_time_99": stats.NodePutFsmTime99,
|
|
"node_put_fsm_time_mean": stats.NodePutFsmTimeMean,
|
|
"node_put_fsm_time_median": stats.NodePutFsmTimeMedian,
|
|
"node_puts": stats.NodePuts,
|
|
"node_puts_total": stats.NodePutsTotal,
|
|
"pbc_active": stats.PbcActive,
|
|
"pbc_connects": stats.PbcConnects,
|
|
"pbc_connects_total": stats.PbcConnectsTotal,
|
|
"vnode_gets": stats.VnodeGets,
|
|
"vnode_gets_total": stats.VnodeGetsTotal,
|
|
"vnode_index_reads": stats.VnodeIndexReads,
|
|
"vnode_index_reads_total": stats.VnodeIndexReadsTotal,
|
|
"vnode_index_writes": stats.VnodeIndexWrites,
|
|
"vnode_index_writes_total": stats.VnodeIndexWritesTotal,
|
|
"vnode_puts": stats.VnodePuts,
|
|
"vnode_puts_total": stats.VnodePutsTotal,
|
|
"read_repairs": stats.ReadRepairs,
|
|
"read_repairs_total": stats.ReadRepairsTotal,
|
|
}
|
|
|
|
// Accumulate the tags and values
|
|
acc.AddFields("riak", fields, tags)
|
|
|
|
return nil
|
|
}
|
|
|
|
func init() {
|
|
inputs.Add("riak", func() telegraf.Input {
|
|
return NewRiak()
|
|
})
|
|
}
|