telegraf/plugins/inputs/ping/ping.go

261 lines
7.1 KiB
Go
Raw Permalink Normal View History

// +build !windows
2015-09-02 23:16:52 +00:00
package ping
import (
"errors"
"fmt"
2017-10-26 20:35:37 +00:00
"net"
2015-09-02 23:16:52 +00:00
"os/exec"
"runtime"
2015-09-02 23:16:52 +00:00
"strconv"
"strings"
"sync"
"syscall"
"time"
2015-09-02 23:16:52 +00:00
"github.com/influxdata/telegraf"
"github.com/influxdata/telegraf/internal"
2016-01-20 18:57:35 +00:00
"github.com/influxdata/telegraf/plugins/inputs"
2015-09-02 23:16:52 +00:00
)
// HostPinger is a function that runs the "ping" command using a list of
// passed arguments. This can be easily switched with a mocked ping function
// for unit test purposes (see ping_test.go).
//
// timeout is the overall time budget for the command, in seconds, and args
// are the command-line arguments handed to ping. It returns the command's
// output as a string together with any error from running it.
type HostPinger func(timeout float64, args ...string) (string, error)
2015-09-02 23:16:52 +00:00
type Ping struct {
// Interval at which to ping (ping -i <INTERVAL>)
PingInterval float64 `toml:"ping_interval"`
// Number of pings to send (ping -c <COUNT>)
Count int
2016-06-10 11:51:43 +00:00
// Ping timeout, in seconds. 0 means no timeout (ping -W <TIMEOUT>)
2015-09-02 23:16:52 +00:00
Timeout float64
// Interface or source address to send ping from (ping -I/-S <INTERFACE/SRC_ADDR>)
2015-09-02 23:16:52 +00:00
Interface string
// URLs to ping
Urls []string
// host ping function
pingHost HostPinger
}
// Description returns a one-line summary of what the plugin does.
func (*Ping) Description() string {
	const summary = "Ping given url(s) and return statistics"
	return summary
}
2016-04-27 21:08:38 +00:00
// sampleConfig is the example TOML configuration returned by SampleConfig.
const sampleConfig = `
## NOTE: this plugin forks the ping command. You may need to set capabilities
## via setcap cap_net_raw+p /bin/ping
#
## List of urls to ping
urls = ["www.google.com"] # required
## number of pings to send per collection (ping -c <COUNT>)
# count = 1
## interval, in s, at which to ping. 0 == default (ping -i <PING_INTERVAL>)
# ping_interval = 1.0
## per-ping timeout, in s. 0 == no timeout (ping -W <TIMEOUT>)
# timeout = 1.0
## interface or source address to send ping from (ping -I <INTERFACE/SRC_ADDR>)
## on Darwin and Freebsd only source address possible: (ping -S <SRC_ADDR>)
# interface = ""
`
// SampleConfig returns the example configuration for the plugin, i.e. the
// package-level sampleConfig string.
func (*Ping) SampleConfig() string {
	return sampleConfig
}
func (p *Ping) Gather(acc telegraf.Accumulator) error {
2015-09-02 23:16:52 +00:00
var wg sync.WaitGroup
// Spin off a go routine for each url to ping
for _, url := range p.Urls {
wg.Add(1)
2016-04-27 21:08:38 +00:00
go func(u string) {
2015-09-02 23:16:52 +00:00
defer wg.Done()
2017-10-26 20:35:37 +00:00
tags := map[string]string{"url": u}
fields := map[string]interface{}{"result_code": 0}
_, err := net.LookupHost(u)
if err != nil {
acc.AddError(err)
fields["result_code"] = 1
acc.AddFields("ping", fields, tags)
return
}
2016-04-27 21:08:38 +00:00
args := p.args(u)
totalTimeout := float64(p.Count)*p.Timeout + float64(p.Count-1)*p.PingInterval
out, err := p.pingHost(totalTimeout, args...)
2015-09-02 23:16:52 +00:00
if err != nil {
// Some implementations of ping return a 1 exit code on
// timeout, if this occurs we will not exit and try to parse
// the output.
status := -1
if exitError, ok := err.(*exec.ExitError); ok {
if ws, ok := exitError.Sys().(syscall.WaitStatus); ok {
status = ws.ExitStatus()
}
}
if status != 1 {
// Combine go err + stderr output
out = strings.TrimSpace(out)
if len(out) > 0 {
acc.AddError(fmt.Errorf("%s, %s", out, err))
} else {
acc.AddError(err)
}
2017-10-26 20:35:37 +00:00
acc.AddFields("ping", fields, tags)
return
}
2015-09-02 23:16:52 +00:00
}
trans, rec, min, avg, max, stddev, err := processPingOutput(out)
2015-09-02 23:16:52 +00:00
if err != nil {
// fatal error
acc.AddError(fmt.Errorf("%s: %s", err, u))
2017-10-26 20:35:37 +00:00
acc.AddFields("ping", fields, tags)
2015-09-02 23:16:52 +00:00
return
}
// Calculate packet loss percentage
loss := float64(trans-rec) / float64(trans) * 100.0
2017-10-26 20:35:37 +00:00
fields["packets_transmitted"] = trans
fields["packets_received"] = rec
fields["percent_packet_loss"] = loss
if min > 0 {
fields["minimum_response_ms"] = min
}
if avg > 0 {
fields["average_response_ms"] = avg
2015-12-15 00:03:33 +00:00
}
if max > 0 {
fields["maximum_response_ms"] = max
}
if stddev > 0 {
fields["standard_deviation_ms"] = stddev
}
2015-12-15 00:03:33 +00:00
acc.AddFields("ping", fields, tags)
2016-04-27 21:08:38 +00:00
}(url)
2015-09-02 23:16:52 +00:00
}
wg.Wait()
2017-04-24 18:13:26 +00:00
return nil
2015-09-02 23:16:52 +00:00
}
func hostPinger(timeout float64, args ...string) (string, error) {
bin, err := exec.LookPath("ping")
if err != nil {
return "", err
}
c := exec.Command(bin, args...)
out, err := internal.CombinedOutputTimeout(c,
time.Second*time.Duration(timeout+5))
2015-09-02 23:16:52 +00:00
return string(out), err
}
// args returns the arguments for the 'ping' executable
func (p *Ping) args(url string) []string {
// Build the ping command args based on toml config
args := []string{"-c", strconv.Itoa(p.Count), "-n", "-s", "16"}
2015-09-02 23:16:52 +00:00
if p.PingInterval > 0 {
args = append(args, "-i", strconv.FormatFloat(p.PingInterval, 'f', 1, 64))
}
if p.Timeout > 0 {
switch runtime.GOOS {
2016-06-10 11:51:43 +00:00
case "darwin":
2016-06-22 17:21:07 +00:00
args = append(args, "-W", strconv.FormatFloat(p.Timeout*1000, 'f', 1, 64))
case "linux":
args = append(args, "-W", strconv.FormatFloat(p.Timeout, 'f', 1, 64))
default:
// Not sure the best option here, just assume GNU ping?
args = append(args, "-W", strconv.FormatFloat(p.Timeout, 'f', 1, 64))
}
2015-09-02 23:16:52 +00:00
}
if p.Interface != "" {
switch runtime.GOOS {
case "linux":
args = append(args, "-I", p.Interface)
case "freebsd", "darwin":
args = append(args, "-S", p.Interface)
default:
// Not sure the best option here, just assume GNU ping?
args = append(args, "-I", p.Interface)
}
2015-09-02 23:16:52 +00:00
}
args = append(args, url)
return args
}
// processPingOutput takes in a string output from the ping command, like:
//
//	PING www.google.com (173.194.115.84): 56 data bytes
//	64 bytes from 173.194.115.84: icmp_seq=0 ttl=54 time=52.172 ms
//	64 bytes from 173.194.115.84: icmp_seq=1 ttl=54 time=34.843 ms
//
//	--- www.google.com ping statistics ---
//	2 packets transmitted, 2 packets received, 0.0% packet loss
//	round-trip min/avg/max/stddev = 34.843/43.508/52.172/8.664 ms
//
// It returns, in order: the transmitted packet count, the received packet
// count, and the minimum, average, maximum and standard deviation of the
// round-trip time as printed on the "min/avg/max" line. Statistics that are
// not present in the output are returned as zero; in particular the standard
// deviation stays zero when the line carries only three values.
//
// The error is nil only if a "transmitted ... received" summary line was found
// and every statistics line could be parsed. Malformed lines produce an error
// instead of a panic.
func processPingOutput(out string) (int, int, float64, float64, float64, float64, error) {
	var trans, recv int
	var minRTT, avgRTT, maxRTT, stddev float64
	var err error

	// Becomes true once the mandatory summary line has been parsed.
	foundSummary := false

	for _, line := range strings.Split(out, "\n") {
		switch {
		case strings.Contains(line, "transmitted") && strings.Contains(line, "received"):
			stats := strings.Split(line, ", ")
			if len(stats) < 2 {
				return trans, recv, minRTT, avgRTT, maxRTT, stddev,
					fmt.Errorf("malformed ping summary line: %q", line)
			}

			// Transmitted packets
			trans, err = strconv.Atoi(strings.Split(stats[0], " ")[0])
			if err != nil {
				return trans, recv, minRTT, avgRTT, maxRTT, stddev, err
			}

			// Received packets
			recv, err = strconv.Atoi(strings.Split(stats[1], " ")[0])
			if err != nil {
				return trans, recv, minRTT, avgRTT, maxRTT, stddev, err
			}
			foundSummary = true

		case strings.Contains(line, "min/avg/max"):
			// The values are the fourth space-separated word, e.g.
			// "round-trip min/avg/max/stddev = 1/2/3/4 ms".
			words := strings.Split(line, " ")
			if len(words) < 4 {
				return trans, recv, minRTT, avgRTT, maxRTT, stddev,
					fmt.Errorf("malformed ping round-trip line: %q", line)
			}
			values := strings.Split(words[3], "/")
			if len(values) < 3 {
				return trans, recv, minRTT, avgRTT, maxRTT, stddev,
					fmt.Errorf("malformed ping round-trip line: %q", line)
			}

			if minRTT, err = strconv.ParseFloat(values[0], 64); err != nil {
				return trans, recv, minRTT, avgRTT, maxRTT, stddev, err
			}
			if avgRTT, err = strconv.ParseFloat(values[1], 64); err != nil {
				return trans, recv, minRTT, avgRTT, maxRTT, stddev, err
			}
			if maxRTT, err = strconv.ParseFloat(values[2], 64); err != nil {
				return trans, recv, minRTT, avgRTT, maxRTT, stddev, err
			}
			// Some ping implementations print only min/avg/max.
			if len(values) > 3 {
				if stddev, err = strconv.ParseFloat(values[3], 64); err != nil {
					return trans, recv, minRTT, avgRTT, maxRTT, stddev, err
				}
			}
		}
	}

	if !foundSummary {
		return trans, recv, minRTT, avgRTT, maxRTT, stddev,
			errors.New("Fatal error processing ping output")
	}
	return trans, recv, minRTT, avgRTT, maxRTT, stddev, nil
}
func init() {
inputs.Add("ping", func() telegraf.Input {
return &Ping{
pingHost: hostPinger,
PingInterval: 1.0,
Count: 1,
Timeout: 1.0,
}
2015-09-02 23:16:52 +00:00
})
}