package mesos

import (
	"encoding/json"
	"fmt"
	"math/rand"
	"net/http"
	"net/http/httptest"
	"os"
	"testing"

	jsonparser "github.com/influxdata/telegraf/plugins/parsers/json"
	"github.com/influxdata/telegraf/testutil"
)

// Fixtures shared by every test in this file. generateMetrics fills the maps
// and TestMain starts the servers before any test runs.
var (
	masterMetrics    map[string]interface{}
	masterTestServer *httptest.Server

	slaveMetrics     map[string]interface{}
	slaveTaskMetrics map[string]interface{}
	slaveTestServer  *httptest.Server
)

// randUUID returns a random identifier laid out like a UUID: five
// dash-separated hex groups built from 16 random bytes.
func randUUID() string {
	b := make([]byte, 16)
	// math/rand's Read is documented to always return a nil error.
	rand.Read(b)
	return fmt.Sprintf("%x-%x-%x-%x-%x", b[0:4], b[4:6], b[6:8], b[8:10], b[10:])
}

// generateMetrics populates masterMetrics, slaveMetrics and slaveTaskMetrics
// with random values keyed by the metric names the tests expect.
func generateMetrics() {
	masterNames := []string{
		// resources
		"master/cpus_percent",
		"master/cpus_used",
		"master/cpus_total",
		"master/cpus_revocable_percent",
		"master/cpus_revocable_total",
		"master/cpus_revocable_used",
		"master/disk_percent",
		"master/disk_used",
		"master/disk_total",
		"master/disk_revocable_percent",
		"master/disk_revocable_total",
		"master/disk_revocable_used",
		"master/gpus_percent",
		"master/gpus_used",
		"master/gpus_total",
		"master/gpus_revocable_percent",
		"master/gpus_revocable_total",
		"master/gpus_revocable_used",
		"master/mem_percent",
		"master/mem_used",
		"master/mem_total",
		"master/mem_revocable_percent",
		"master/mem_revocable_total",
		"master/mem_revocable_used",
		// master
		"master/elected",
		"master/uptime_secs",
		// system
		"system/cpus_total",
		"system/load_15min",
		"system/load_5min",
		"system/load_1min",
		"system/mem_free_bytes",
		"system/mem_total_bytes",
		// agents
		"master/slave_registrations",
		"master/slave_removals",
		"master/slave_reregistrations",
		"master/slave_shutdowns_scheduled",
		"master/slave_shutdowns_canceled",
		"master/slave_shutdowns_completed",
		"master/slaves_active",
		"master/slaves_connected",
		"master/slaves_disconnected",
		"master/slaves_inactive",
		// frameworks
		"master/frameworks_active",
		"master/frameworks_connected",
		"master/frameworks_disconnected",
		"master/frameworks_inactive",
		"master/outstanding_offers",
		// tasks
		"master/tasks_error",
		"master/tasks_failed",
		"master/tasks_finished",
		"master/tasks_killed",
		"master/tasks_lost",
		"master/tasks_running",
		"master/tasks_staging",
		"master/tasks_starting",
		// messages
		"master/invalid_executor_to_framework_messages",
		"master/invalid_framework_to_executor_messages",
		"master/invalid_status_update_acknowledgements",
		"master/invalid_status_updates",
		"master/dropped_messages",
		"master/messages_authenticate",
		"master/messages_deactivate_framework",
		"master/messages_decline_offers",
		"master/messages_executor_to_framework",
		"master/messages_exited_executor",
		"master/messages_framework_to_executor",
		"master/messages_kill_task",
		"master/messages_launch_tasks",
		"master/messages_reconcile_tasks",
		"master/messages_register_framework",
		"master/messages_register_slave",
		"master/messages_reregister_framework",
		"master/messages_reregister_slave",
		"master/messages_resource_request",
		"master/messages_revive_offers",
		"master/messages_status_update",
		"master/messages_status_update_acknowledgement",
		"master/messages_unregister_framework",
		"master/messages_unregister_slave",
		"master/messages_update_slave",
		"master/recovery_slave_removals",
		"master/slave_removals/reason_registered",
		"master/slave_removals/reason_unhealthy",
		"master/slave_removals/reason_unregistered",
		"master/valid_framework_to_executor_messages",
		"master/valid_status_update_acknowledgements",
		"master/valid_status_updates",
		"master/task_lost/source_master/reason_invalid_offers",
		"master/task_lost/source_master/reason_slave_removed",
		"master/task_lost/source_slave/reason_executor_terminated",
		"master/valid_executor_to_framework_messages",
		// evqueue
		"master/event_queue_dispatches",
		"master/event_queue_http_requests",
		"master/event_queue_messages",
		// registrar
		"registrar/state_fetch_ms",
		"registrar/state_store_ms",
		"registrar/state_store_ms/max",
		"registrar/state_store_ms/min",
		"registrar/state_store_ms/p50",
		"registrar/state_store_ms/p90",
		"registrar/state_store_ms/p95",
		"registrar/state_store_ms/p99",
		"registrar/state_store_ms/p999",
		"registrar/state_store_ms/p9999",
	}

	masterMetrics = make(map[string]interface{}, len(masterNames))
	for _, name := range masterNames {
		masterMetrics[name] = rand.Float64()
	}

	slaveNames := []string{
		// resources
		"slave/cpus_percent",
		"slave/cpus_used",
		"slave/cpus_total",
		"slave/cpus_revocable_percent",
		"slave/cpus_revocable_total",
		"slave/cpus_revocable_used",
		"slave/disk_percent",
		"slave/disk_used",
		"slave/disk_total",
		"slave/disk_revocable_percent",
		"slave/disk_revocable_total",
		"slave/disk_revocable_used",
		"slave/gpus_percent",
		"slave/gpus_used",
		"slave/gpus_total",
		"slave/gpus_revocable_percent",
		"slave/gpus_revocable_total",
		"slave/gpus_revocable_used",
		"slave/mem_percent",
		"slave/mem_used",
		"slave/mem_total",
		"slave/mem_revocable_percent",
		"slave/mem_revocable_total",
		"slave/mem_revocable_used",
		// agent
		"slave/registered",
		"slave/uptime_secs",
		// system
		"system/cpus_total",
		"system/load_15min",
		"system/load_5min",
		"system/load_1min",
		"system/mem_free_bytes",
		"system/mem_total_bytes",
		// executors
		"containerizer/mesos/container_destroy_errors",
		"slave/container_launch_errors",
		"slave/executors_preempted",
		"slave/frameworks_active",
		"slave/executor_directory_max_allowed_age_secs",
		"slave/executors_registering",
		"slave/executors_running",
		"slave/executors_terminated",
		"slave/executors_terminating",
		"slave/recovery_errors",
		// tasks
		"slave/tasks_failed",
		"slave/tasks_finished",
		"slave/tasks_killed",
		"slave/tasks_lost",
		"slave/tasks_running",
		"slave/tasks_staging",
		"slave/tasks_starting",
		// messages
		"slave/invalid_framework_messages",
		"slave/invalid_status_updates",
		"slave/valid_framework_messages",
		"slave/valid_status_updates",
	}

	slaveMetrics = make(map[string]interface{}, len(slaveNames))
	for _, name := range slaveNames {
		slaveMetrics[name] = rand.Float64()
	}

	// A single task entry; the /monitor/statistics handler wraps it in a
	// one-element array when serving it.
	slaveTaskMetrics = map[string]interface{}{
		"executor_id":   fmt.Sprintf("task_%s", randUUID()),
		"executor_name": "Some task description",
		"framework_id":  randUUID(),
		"source":        fmt.Sprintf("task_source_%s", randUUID()),
		"statistics": map[string]interface{}{
			"cpus_limit":                    rand.Float64(),
			"cpus_system_time_secs":         rand.Float64(),
			"cpus_user_time_secs":           rand.Float64(),
			"mem_anon_bytes":                float64(rand.Int63()),
			"mem_cache_bytes":               float64(rand.Int63()),
			"mem_critical_pressure_counter": float64(rand.Int63()),
			"mem_file_bytes":                float64(rand.Int63()),
			"mem_limit_bytes":               float64(rand.Int63()),
			"mem_low_pressure_counter":      float64(rand.Int63()),
			"mem_mapped_file_bytes":         float64(rand.Int63()),
			"mem_medium_pressure_counter":   float64(rand.Int63()),
			"mem_rss_bytes":                 float64(rand.Int63()),
			"mem_swap_bytes":                float64(rand.Int63()),
			"mem_total_bytes":               float64(rand.Int63()),
			"mem_total_memsw_bytes":         float64(rand.Int63()),
			"mem_unevictable_bytes":         float64(rand.Int63()),
			"timestamp":                     rand.Float64(),
		},
	}
}

// TestMain generates the fixtures, starts one fake master and one fake slave
// HTTP server that serve them as JSON, runs the tests, and then shuts the
// servers down before exiting with the test run's status code.
func TestMain(m *testing.M) {
	generateMetrics()

	// writeJSON sends v as a JSON response body. The Content-Type header has
	// to be set before anything is written: header changes made after
	// WriteHeader (or the first Write) are not sent to the client. The 200
	// status is written implicitly by the first Write.
	writeJSON := func(w http.ResponseWriter, v interface{}) {
		w.Header().Set("Content-Type", "application/json")
		if err := json.NewEncoder(w).Encode(v); err != nil {
			http.Error(w, err.Error(), http.StatusInternalServerError)
		}
	}

	// The handlers read the package-level fixtures at request time rather
	// than capturing them up front.
	masterRouter := http.NewServeMux()
	masterRouter.HandleFunc("/metrics/snapshot", func(w http.ResponseWriter, r *http.Request) {
		writeJSON(w, masterMetrics)
	})
	masterTestServer = httptest.NewServer(masterRouter)

	slaveRouter := http.NewServeMux()
	slaveRouter.HandleFunc("/metrics/snapshot", func(w http.ResponseWriter, r *http.Request) {
		writeJSON(w, slaveMetrics)
	})
	slaveRouter.HandleFunc("/monitor/statistics", func(w http.ResponseWriter, r *http.Request) {
		writeJSON(w, []map[string]interface{}{slaveTaskMetrics})
	})
	slaveTestServer = httptest.NewServer(slaveRouter)

	code := m.Run()

	// os.Exit does not run deferred calls, so close the servers explicitly.
	masterTestServer.Close()
	slaveTestServer.Close()
	os.Exit(code)
}

// TestMesosMaster gathers from the fake master and checks that every
// generated master metric is reported under the "mesos" measurement.
func TestMesosMaster(t *testing.T) {
	var acc testutil.Accumulator

	m := Mesos{
		Masters: []string{masterTestServer.Listener.Addr().String()},
		Timeout: 10,
	}

	if err := m.Gather(&acc); err != nil {
		t.Error(err)
	}

	acc.AssertContainsFields(t, "mesos", masterMetrics)
}

// TestMasterFilter checks that filtering the master metrics with MasterCols
// set removes the metrics of every unlisted group and keeps the listed ones.
//
// filterMetrics is handed a pointer to the shared masterMetrics fixture, so
// whatever it changes is visible to any test that runs afterwards.
func TestMasterFilter(t *testing.T) {
	m := Mesos{
		MasterCols: []string{
			"resources", "master", "registrar",
		},
	}
	excluded := []string{
		"system", "agents", "frameworks",
		"messages", "evqueue", "tasks",
	}

	m.filterMetrics(MASTER, &masterMetrics)

	for _, group := range excluded {
		for _, key := range getMetrics(MASTER, group) {
			if _, ok := masterMetrics[key]; ok {
				t.Errorf("Found key %s, it should be gone.", key)
			}
		}
	}
	for _, group := range m.MasterCols {
		for _, key := range getMetrics(MASTER, group) {
			if _, ok := masterMetrics[key]; !ok {
				t.Errorf("Didn't find key %s, it should present.", key)
			}
		}
	}
}

// TestMesosSlave gathers from the fake slave with task collection enabled and
// checks both the slave metrics ("mesos") and the flattened task statistics
// ("mesos-tasks").
func TestMesosSlave(t *testing.T) {
	var acc testutil.Accumulator

	m := Mesos{
		Masters:    []string{},
		Slaves:     []string{slaveTestServer.Listener.Addr().String()},
		SlaveTasks: true,
		Timeout:    10,
	}

	if err := m.Gather(&acc); err != nil {
		t.Error(err)
	}

	acc.AssertContainsFields(t, "mesos", slaveMetrics)

	// Flatten the nested task fixture so it can be compared with the
	// accumulated "mesos-tasks" fields.
	jf := jsonparser.JSONFlattener{}
	if err := jf.FlattenJSON("", slaveTaskMetrics); err != nil {
		t.Error(err)
	}

	acc.AssertContainsFields(t, "mesos-tasks", jf.Fields)
}

// TestSlaveFilter checks that filtering the slave metrics with SlaveCols set
// removes the metrics of every unlisted group and keeps the listed ones.
//
// filterMetrics is handed a pointer to the shared slaveMetrics fixture, so
// whatever it changes is visible to any test that runs afterwards.
func TestSlaveFilter(t *testing.T) {
	m := Mesos{
		SlaveCols: []string{
			"resources", "agent", "tasks",
		},
	}
	excluded := []string{
		"system", "executors", "messages",
	}

	m.filterMetrics(SLAVE, &slaveMetrics)

	for _, group := range excluded {
		for _, key := range getMetrics(SLAVE, group) {
			if _, ok := slaveMetrics[key]; ok {
				t.Errorf("Found key %s, it should be gone.", key)
			}
		}
	}
	// Iterate over SlaveCols: MasterCols is empty in this test, so ranging
	// over it would silently skip every "should be present" assertion.
	for _, group := range m.SlaveCols {
		for _, key := range getMetrics(SLAVE, group) {
			if _, ok := slaveMetrics[key]; !ok {
				t.Errorf("Didn't find key %s, it should present.", key)
			}
		}
	}
}