2016-01-31 21:45:44 +00:00
|
|
|
package mesos
|
|
|
|
|
|
|
|
import (
|
|
|
|
"encoding/json"
|
2016-06-09 10:33:14 +00:00
|
|
|
"fmt"
|
2016-01-31 21:45:44 +00:00
|
|
|
"math/rand"
|
|
|
|
"net/http"
|
|
|
|
"net/http/httptest"
|
|
|
|
"os"
|
|
|
|
"testing"
|
|
|
|
|
|
|
|
"github.com/influxdata/telegraf/testutil"
|
|
|
|
)
|
|
|
|
|
2016-06-09 10:33:14 +00:00
|
|
|
// Shared fixtures for the tests in this file. The metric maps are filled by
// generateMetrics and the servers are started and stopped by TestMain.
var (
	masterMetrics map[string]interface{}
	slaveMetrics  map[string]interface{}
	// slaveTaskMetrics map[string]interface{} // disabled together with the task-statistics checks

	masterTestServer *httptest.Server
	slaveTestServer  *httptest.Server
)
|
|
|
|
|
|
|
|
// randUUID returns 16 pseudo-random bytes rendered as lowercase hex in the
// 8-4-4-4-12 dash-separated layout. The bytes come from math/rand, so the
// result is only suitable as test data.
func randUUID() string {
	var raw [16]byte
	rand.Read(raw[:])
	return fmt.Sprintf(
		"%x-%x-%x-%x-%x",
		raw[:4], raw[4:6], raw[6:8], raw[8:10], raw[10:],
	)
}
|
2016-01-31 21:45:44 +00:00
|
|
|
|
|
|
|
func generateMetrics() {
|
2016-06-09 10:33:14 +00:00
|
|
|
masterMetrics = make(map[string]interface{})
|
|
|
|
|
|
|
|
metricNames := []string{
|
|
|
|
// resources
|
|
|
|
"master/cpus_percent",
|
|
|
|
"master/cpus_used",
|
|
|
|
"master/cpus_total",
|
|
|
|
"master/cpus_revocable_percent",
|
|
|
|
"master/cpus_revocable_total",
|
|
|
|
"master/cpus_revocable_used",
|
|
|
|
"master/disk_percent",
|
|
|
|
"master/disk_used",
|
|
|
|
"master/disk_total",
|
|
|
|
"master/disk_revocable_percent",
|
|
|
|
"master/disk_revocable_total",
|
|
|
|
"master/disk_revocable_used",
|
|
|
|
"master/gpus_percent",
|
|
|
|
"master/gpus_used",
|
|
|
|
"master/gpus_total",
|
|
|
|
"master/gpus_revocable_percent",
|
|
|
|
"master/gpus_revocable_total",
|
|
|
|
"master/gpus_revocable_used",
|
|
|
|
"master/mem_percent",
|
|
|
|
"master/mem_used",
|
|
|
|
"master/mem_total",
|
|
|
|
"master/mem_revocable_percent",
|
|
|
|
"master/mem_revocable_total",
|
|
|
|
"master/mem_revocable_used",
|
|
|
|
// master
|
|
|
|
"master/elected",
|
|
|
|
"master/uptime_secs",
|
|
|
|
// system
|
|
|
|
"system/cpus_total",
|
|
|
|
"system/load_15min",
|
|
|
|
"system/load_5min",
|
|
|
|
"system/load_1min",
|
|
|
|
"system/mem_free_bytes",
|
|
|
|
"system/mem_total_bytes",
|
|
|
|
// agents
|
|
|
|
"master/slave_registrations",
|
|
|
|
"master/slave_removals",
|
|
|
|
"master/slave_reregistrations",
|
|
|
|
"master/slave_shutdowns_scheduled",
|
|
|
|
"master/slave_shutdowns_canceled",
|
|
|
|
"master/slave_shutdowns_completed",
|
|
|
|
"master/slaves_active",
|
|
|
|
"master/slaves_connected",
|
|
|
|
"master/slaves_disconnected",
|
|
|
|
"master/slaves_inactive",
|
|
|
|
// frameworks
|
|
|
|
"master/frameworks_active",
|
|
|
|
"master/frameworks_connected",
|
|
|
|
"master/frameworks_disconnected",
|
|
|
|
"master/frameworks_inactive",
|
|
|
|
"master/outstanding_offers",
|
|
|
|
// tasks
|
|
|
|
"master/tasks_error",
|
|
|
|
"master/tasks_failed",
|
|
|
|
"master/tasks_finished",
|
|
|
|
"master/tasks_killed",
|
|
|
|
"master/tasks_lost",
|
|
|
|
"master/tasks_running",
|
|
|
|
"master/tasks_staging",
|
|
|
|
"master/tasks_starting",
|
|
|
|
// messages
|
|
|
|
"master/invalid_executor_to_framework_messages",
|
|
|
|
"master/invalid_framework_to_executor_messages",
|
|
|
|
"master/invalid_status_update_acknowledgements",
|
|
|
|
"master/invalid_status_updates",
|
|
|
|
"master/dropped_messages",
|
|
|
|
"master/messages_authenticate",
|
|
|
|
"master/messages_deactivate_framework",
|
|
|
|
"master/messages_decline_offers",
|
|
|
|
"master/messages_executor_to_framework",
|
|
|
|
"master/messages_exited_executor",
|
|
|
|
"master/messages_framework_to_executor",
|
|
|
|
"master/messages_kill_task",
|
|
|
|
"master/messages_launch_tasks",
|
|
|
|
"master/messages_reconcile_tasks",
|
|
|
|
"master/messages_register_framework",
|
|
|
|
"master/messages_register_slave",
|
|
|
|
"master/messages_reregister_framework",
|
|
|
|
"master/messages_reregister_slave",
|
|
|
|
"master/messages_resource_request",
|
|
|
|
"master/messages_revive_offers",
|
|
|
|
"master/messages_status_update",
|
|
|
|
"master/messages_status_update_acknowledgement",
|
|
|
|
"master/messages_unregister_framework",
|
|
|
|
"master/messages_unregister_slave",
|
|
|
|
"master/messages_update_slave",
|
|
|
|
"master/recovery_slave_removals",
|
|
|
|
"master/slave_removals/reason_registered",
|
|
|
|
"master/slave_removals/reason_unhealthy",
|
|
|
|
"master/slave_removals/reason_unregistered",
|
|
|
|
"master/valid_framework_to_executor_messages",
|
|
|
|
"master/valid_status_update_acknowledgements",
|
|
|
|
"master/valid_status_updates",
|
|
|
|
"master/task_lost/source_master/reason_invalid_offers",
|
|
|
|
"master/task_lost/source_master/reason_slave_removed",
|
|
|
|
"master/task_lost/source_slave/reason_executor_terminated",
|
|
|
|
"master/valid_executor_to_framework_messages",
|
|
|
|
// evgqueue
|
|
|
|
"master/event_queue_dispatches",
|
|
|
|
"master/event_queue_http_requests",
|
|
|
|
"master/event_queue_messages",
|
|
|
|
// registrar
|
|
|
|
"registrar/state_fetch_ms",
|
|
|
|
"registrar/state_store_ms",
|
|
|
|
"registrar/state_store_ms/max",
|
|
|
|
"registrar/state_store_ms/min",
|
|
|
|
"registrar/state_store_ms/p50",
|
|
|
|
"registrar/state_store_ms/p90",
|
|
|
|
"registrar/state_store_ms/p95",
|
|
|
|
"registrar/state_store_ms/p99",
|
|
|
|
"registrar/state_store_ms/p999",
|
|
|
|
"registrar/state_store_ms/p9999",
|
|
|
|
}
|
|
|
|
|
|
|
|
for _, k := range metricNames {
|
|
|
|
masterMetrics[k] = rand.Float64()
|
|
|
|
}
|
|
|
|
|
|
|
|
slaveMetrics = make(map[string]interface{})
|
|
|
|
|
|
|
|
metricNames = []string{
|
|
|
|
// resources
|
|
|
|
"slave/cpus_percent",
|
|
|
|
"slave/cpus_used",
|
|
|
|
"slave/cpus_total",
|
|
|
|
"slave/cpus_revocable_percent",
|
|
|
|
"slave/cpus_revocable_total",
|
|
|
|
"slave/cpus_revocable_used",
|
|
|
|
"slave/disk_percent",
|
|
|
|
"slave/disk_used",
|
|
|
|
"slave/disk_total",
|
|
|
|
"slave/disk_revocable_percent",
|
|
|
|
"slave/disk_revocable_total",
|
|
|
|
"slave/disk_revocable_used",
|
|
|
|
"slave/gpus_percent",
|
|
|
|
"slave/gpus_used",
|
|
|
|
"slave/gpus_total",
|
|
|
|
"slave/gpus_revocable_percent",
|
|
|
|
"slave/gpus_revocable_total",
|
|
|
|
"slave/gpus_revocable_used",
|
|
|
|
"slave/mem_percent",
|
|
|
|
"slave/mem_used",
|
|
|
|
"slave/mem_total",
|
|
|
|
"slave/mem_revocable_percent",
|
|
|
|
"slave/mem_revocable_total",
|
|
|
|
"slave/mem_revocable_used",
|
|
|
|
// agent
|
|
|
|
"slave/registered",
|
|
|
|
"slave/uptime_secs",
|
|
|
|
// system
|
|
|
|
"system/cpus_total",
|
|
|
|
"system/load_15min",
|
|
|
|
"system/load_5min",
|
|
|
|
"system/load_1min",
|
|
|
|
"system/mem_free_bytes",
|
|
|
|
"system/mem_total_bytes",
|
|
|
|
// executors
|
|
|
|
"containerizer/mesos/container_destroy_errors",
|
|
|
|
"slave/container_launch_errors",
|
|
|
|
"slave/executors_preempted",
|
|
|
|
"slave/frameworks_active",
|
|
|
|
"slave/executor_directory_max_allowed_age_secs",
|
|
|
|
"slave/executors_registering",
|
|
|
|
"slave/executors_running",
|
|
|
|
"slave/executors_terminated",
|
|
|
|
"slave/executors_terminating",
|
|
|
|
"slave/recovery_errors",
|
|
|
|
// tasks
|
|
|
|
"slave/tasks_failed",
|
|
|
|
"slave/tasks_finished",
|
|
|
|
"slave/tasks_killed",
|
|
|
|
"slave/tasks_lost",
|
|
|
|
"slave/tasks_running",
|
|
|
|
"slave/tasks_staging",
|
|
|
|
"slave/tasks_starting",
|
|
|
|
// messages
|
|
|
|
"slave/invalid_framework_messages",
|
|
|
|
"slave/invalid_status_updates",
|
|
|
|
"slave/valid_framework_messages",
|
|
|
|
"slave/valid_status_updates",
|
|
|
|
}
|
2016-01-31 21:45:44 +00:00
|
|
|
|
|
|
|
for _, k := range metricNames {
|
2016-06-09 10:33:14 +00:00
|
|
|
slaveMetrics[k] = rand.Float64()
|
|
|
|
}
|
|
|
|
|
2016-09-23 19:39:59 +00:00
|
|
|
// slaveTaskMetrics = map[string]interface{}{
|
|
|
|
// "executor_id": fmt.Sprintf("task_name.%s", randUUID()),
|
|
|
|
// "executor_name": "Some task description",
|
|
|
|
// "framework_id": randUUID(),
|
|
|
|
// "source": fmt.Sprintf("task_source.%s", randUUID()),
|
|
|
|
// "statistics": map[string]interface{}{
|
|
|
|
// "cpus_limit": rand.Float64(),
|
|
|
|
// "cpus_system_time_secs": rand.Float64(),
|
|
|
|
// "cpus_user_time_secs": rand.Float64(),
|
|
|
|
// "mem_anon_bytes": float64(rand.Int63()),
|
|
|
|
// "mem_cache_bytes": float64(rand.Int63()),
|
|
|
|
// "mem_critical_pressure_counter": float64(rand.Int63()),
|
|
|
|
// "mem_file_bytes": float64(rand.Int63()),
|
|
|
|
// "mem_limit_bytes": float64(rand.Int63()),
|
|
|
|
// "mem_low_pressure_counter": float64(rand.Int63()),
|
|
|
|
// "mem_mapped_file_bytes": float64(rand.Int63()),
|
|
|
|
// "mem_medium_pressure_counter": float64(rand.Int63()),
|
|
|
|
// "mem_rss_bytes": float64(rand.Int63()),
|
|
|
|
// "mem_swap_bytes": float64(rand.Int63()),
|
|
|
|
// "mem_total_bytes": float64(rand.Int63()),
|
|
|
|
// "mem_total_memsw_bytes": float64(rand.Int63()),
|
|
|
|
// "mem_unevictable_bytes": float64(rand.Int63()),
|
|
|
|
// "timestamp": rand.Float64(),
|
|
|
|
// },
|
|
|
|
// }
|
2016-01-31 21:45:44 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
func TestMain(m *testing.M) {
|
|
|
|
generateMetrics()
|
2016-06-09 10:33:14 +00:00
|
|
|
|
|
|
|
masterRouter := http.NewServeMux()
|
|
|
|
masterRouter.HandleFunc("/metrics/snapshot", func(w http.ResponseWriter, r *http.Request) {
|
|
|
|
w.WriteHeader(http.StatusOK)
|
|
|
|
w.Header().Set("Content-Type", "application/json")
|
|
|
|
json.NewEncoder(w).Encode(masterMetrics)
|
|
|
|
})
|
|
|
|
masterTestServer = httptest.NewServer(masterRouter)
|
|
|
|
|
|
|
|
slaveRouter := http.NewServeMux()
|
|
|
|
slaveRouter.HandleFunc("/metrics/snapshot", func(w http.ResponseWriter, r *http.Request) {
|
|
|
|
w.WriteHeader(http.StatusOK)
|
|
|
|
w.Header().Set("Content-Type", "application/json")
|
|
|
|
json.NewEncoder(w).Encode(slaveMetrics)
|
|
|
|
})
|
2016-09-23 19:39:59 +00:00
|
|
|
// slaveRouter.HandleFunc("/monitor/statistics", func(w http.ResponseWriter, r *http.Request) {
|
|
|
|
// w.WriteHeader(http.StatusOK)
|
|
|
|
// w.Header().Set("Content-Type", "application/json")
|
|
|
|
// json.NewEncoder(w).Encode([]map[string]interface{}{slaveTaskMetrics})
|
|
|
|
// })
|
2016-06-09 10:33:14 +00:00
|
|
|
slaveTestServer = httptest.NewServer(slaveRouter)
|
|
|
|
|
2016-01-31 21:45:44 +00:00
|
|
|
rc := m.Run()
|
2016-06-09 10:33:14 +00:00
|
|
|
|
|
|
|
masterTestServer.Close()
|
|
|
|
slaveTestServer.Close()
|
2016-01-31 21:45:44 +00:00
|
|
|
os.Exit(rc)
|
|
|
|
}
|
|
|
|
|
|
|
|
func TestMesosMaster(t *testing.T) {
|
|
|
|
var acc testutil.Accumulator
|
|
|
|
|
|
|
|
m := Mesos{
|
2016-06-09 10:33:14 +00:00
|
|
|
Masters: []string{masterTestServer.Listener.Addr().String()},
|
2016-02-10 23:57:36 +00:00
|
|
|
Timeout: 10,
|
2016-01-31 21:45:44 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
err := m.Gather(&acc)
|
|
|
|
|
|
|
|
if err != nil {
|
|
|
|
t.Errorf(err.Error())
|
|
|
|
}
|
|
|
|
|
2016-06-09 10:33:14 +00:00
|
|
|
acc.AssertContainsFields(t, "mesos", masterMetrics)
|
2016-01-31 21:45:44 +00:00
|
|
|
}
|
|
|
|
|
2016-06-09 10:33:14 +00:00
|
|
|
func TestMasterFilter(t *testing.T) {
|
2016-02-04 01:46:20 +00:00
|
|
|
m := Mesos{
|
2016-02-11 00:06:51 +00:00
|
|
|
MasterCols: []string{
|
2016-02-04 01:46:20 +00:00
|
|
|
"resources", "master", "registrar",
|
|
|
|
},
|
|
|
|
}
|
|
|
|
b := []string{
|
2016-06-09 10:33:14 +00:00
|
|
|
"system", "agents", "frameworks",
|
|
|
|
"messages", "evqueue", "tasks",
|
|
|
|
}
|
|
|
|
|
|
|
|
m.filterMetrics(MASTER, &masterMetrics)
|
|
|
|
|
|
|
|
for _, v := range b {
|
|
|
|
for _, x := range getMetrics(MASTER, v) {
|
|
|
|
if _, ok := masterMetrics[x]; ok {
|
|
|
|
t.Errorf("Found key %s, it should be gone.", x)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
for _, v := range m.MasterCols {
|
|
|
|
for _, x := range getMetrics(MASTER, v) {
|
|
|
|
if _, ok := masterMetrics[x]; !ok {
|
|
|
|
t.Errorf("Didn't find key %s, it should present.", x)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func TestMesosSlave(t *testing.T) {
|
|
|
|
var acc testutil.Accumulator
|
|
|
|
|
|
|
|
m := Mesos{
|
2016-09-23 19:39:59 +00:00
|
|
|
Masters: []string{},
|
|
|
|
Slaves: []string{slaveTestServer.Listener.Addr().String()},
|
|
|
|
// SlaveTasks: true,
|
|
|
|
Timeout: 10,
|
2016-06-09 10:33:14 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
err := m.Gather(&acc)
|
|
|
|
|
|
|
|
if err != nil {
|
|
|
|
t.Errorf(err.Error())
|
|
|
|
}
|
|
|
|
|
|
|
|
acc.AssertContainsFields(t, "mesos", slaveMetrics)
|
|
|
|
|
2016-09-23 19:39:59 +00:00
|
|
|
// expectedFields := make(map[string]interface{}, len(slaveTaskMetrics["statistics"].(map[string]interface{}))+1)
|
|
|
|
// for k, v := range slaveTaskMetrics["statistics"].(map[string]interface{}) {
|
|
|
|
// expectedFields[k] = v
|
|
|
|
// }
|
|
|
|
// expectedFields["executor_id"] = slaveTaskMetrics["executor_id"]
|
|
|
|
|
|
|
|
// acc.AssertContainsTaggedFields(
|
|
|
|
// t,
|
|
|
|
// "mesos_tasks",
|
|
|
|
// expectedFields,
|
|
|
|
// map[string]string{"server": "127.0.0.1", "framework_id": slaveTaskMetrics["framework_id"].(string)})
|
2016-06-09 10:33:14 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
func TestSlaveFilter(t *testing.T) {
|
|
|
|
m := Mesos{
|
|
|
|
SlaveCols: []string{
|
|
|
|
"resources", "agent", "tasks",
|
|
|
|
},
|
|
|
|
}
|
|
|
|
b := []string{
|
|
|
|
"system", "executors", "messages",
|
2016-01-31 21:45:44 +00:00
|
|
|
}
|
|
|
|
|
2016-06-09 10:33:14 +00:00
|
|
|
m.filterMetrics(SLAVE, &slaveMetrics)
|
2016-01-31 21:45:44 +00:00
|
|
|
|
2016-02-04 01:46:20 +00:00
|
|
|
for _, v := range b {
|
2016-06-09 10:33:14 +00:00
|
|
|
for _, x := range getMetrics(SLAVE, v) {
|
|
|
|
if _, ok := slaveMetrics[x]; ok {
|
2016-02-03 02:31:39 +00:00
|
|
|
t.Errorf("Found key %s, it should be gone.", x)
|
|
|
|
}
|
2016-01-31 21:45:44 +00:00
|
|
|
}
|
|
|
|
}
|
2016-02-11 00:06:51 +00:00
|
|
|
for _, v := range m.MasterCols {
|
2016-06-09 10:33:14 +00:00
|
|
|
for _, x := range getMetrics(SLAVE, v) {
|
|
|
|
if _, ok := slaveMetrics[x]; !ok {
|
2016-02-10 23:57:36 +00:00
|
|
|
t.Errorf("Didn't find key %s, it should present.", x)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2016-01-31 21:45:44 +00:00
|
|
|
}
|