// Copyright 2015 The go-ethereum Authors
// This file is part of go-ethereum.
//
// go-ethereum is free software: you can redistribute it and/or modify
// it under the terms of the GNU General Public License as published by
// the Free Software Foundation, either version 3 of the License, or
// (at your option) any later version.
//
// go-ethereum is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU General Public License for more details.
//
// You should have received a copy of the GNU General Public License
// along with go-ethereum. If not, see <http://www.gnu.org/licenses/>.

17 18 19
package main

import (
20
	"fmt"
21
	"math"
22
	"reflect"
23
	"runtime"
24
	"sort"
25 26 27 28
	"strings"
	"time"

	"github.com/ethereum/go-ethereum/cmd/utils"
29
	"github.com/ethereum/go-ethereum/node"
30 31
	"github.com/ethereum/go-ethereum/rpc"
	"github.com/gizak/termui"
32
	"gopkg.in/urfave/cli.v1"
33 34
)

35 36 37
var (
	monitorCommandAttachFlag = cli.StringFlag{
		Name:  "attach",
38
		Value: node.DefaultIPCEndpoint(clientIdentifier),
39
		Usage: "API endpoint to attach to",
40 41 42 43
	}
	monitorCommandRowsFlag = cli.IntFlag{
		Name:  "rows",
		Value: 5,
44 45 46 47 48 49
		Usage: "Maximum rows in the chart grid",
	}
	monitorCommandRefreshFlag = cli.IntFlag{
		Name:  "refresh",
		Value: 3,
		Usage: "Refresh interval in seconds",
50 51
	}
	monitorCommand = cli.Command{
52
		Action:    utils.MigrateFlags(monitor), // keep track of migration progress
53 54 55 56
		Name:      "monitor",
		Usage:     "Monitor and visualize node metrics",
		ArgsUsage: " ",
		Category:  "MONITOR COMMANDS",
57 58 59 60 61 62 63 64
		Description: `
The Geth monitor is a tool to collect and visualize various internal metrics
gathered by the node, supporting different chart types as well as the capacity
to display multiple metrics simultaneously.
`,
		Flags: []cli.Flag{
			monitorCommandAttachFlag,
			monitorCommandRowsFlag,
65
			monitorCommandRefreshFlag,
66 67 68 69
		},
	}
)

70
// monitor starts a terminal UI based monitoring tool for the requested metrics.
71
func monitor(ctx *cli.Context) error {
72
	var (
73
		client *rpc.Client
74 75 76
		err    error
	)
	// Attach to an Ethereum node over IPC or RPC
77
	endpoint := ctx.String(monitorCommandAttachFlag.Name)
78
	if client, err = dialRPC(endpoint); err != nil {
79
		utils.Fatalf("Unable to attach to geth node: %v", err)
80 81 82 83
	}
	defer client.Close()

	// Retrieve all the available metrics and resolve the user pattens
84
	metrics, err := retrieveMetrics(client)
85 86 87
	if err != nil {
		utils.Fatalf("Failed to retrieve system metrics: %v", err)
	}
88
	monitored := resolveMetrics(metrics, ctx.Args())
89
	if len(monitored) == 0 {
90
		list := expandMetrics(metrics, "")
91
		sort.Strings(list)
92 93 94 95

		if len(list) > 0 {
			utils.Fatalf("No metrics specified.\n\nAvailable:\n - %s", strings.Join(list, "\n - "))
		} else {
96
			utils.Fatalf("No metrics collected by geth (--%s).\n", utils.MetricsEnabledFlag.Name)
97
		}
98
	}
99
	sort.Strings(monitored)
100 101 102
	if cols := len(monitored) / ctx.Int(monitorCommandRowsFlag.Name); cols > 6 {
		utils.Fatalf("Requested metrics (%d) spans more that 6 columns:\n - %s", len(monitored), strings.Join(monitored, "\n - "))
	}
103
	// Create and configure the chart UI defaults
104 105 106 107 108
	if err := termui.Init(); err != nil {
		utils.Fatalf("Unable to initialize terminal UI: %v", err)
	}
	defer termui.Close()

109
	rows := len(monitored)
110 111
	if max := ctx.Int(monitorCommandRowsFlag.Name); rows > max {
		rows = max
112
	}
113 114 115 116 117
	cols := (len(monitored) + rows - 1) / rows
	for i := 0; i < rows; i++ {
		termui.Body.AddRows(termui.NewRow())
	}
	// Create each individual data chart
118
	footer := termui.NewPar("")
119
	footer.Block.Border = true
120 121
	footer.Height = 3

122
	charts := make([]*termui.LineChart, len(monitored))
123
	units := make([]int, len(monitored))
124
	data := make([][]float64, len(monitored))
125 126
	for i := 0; i < len(monitored); i++ {
		charts[i] = createChart((termui.TermHeight() - footer.Height) / rows)
127 128
		row := termui.Body.Rows[i%rows]
		row.Cols = append(row.Cols, termui.NewCol(12/cols, 0, charts[i]))
129
	}
130
	termui.Body.AddRows(termui.NewRow(termui.NewCol(12, 0, footer)))
131

132
	refreshCharts(client, monitored, data, units, charts, ctx, footer)
133
	termui.Body.Align()
134 135 136
	termui.Render(termui.Body)

	// Watch for various system events, and periodically refresh the charts
137 138 139 140 141 142 143 144 145 146 147 148 149 150
	termui.Handle("/sys/kbd/C-c", func(termui.Event) {
		termui.StopLoop()
	})
	termui.Handle("/sys/wnd/resize", func(termui.Event) {
		termui.Body.Width = termui.TermWidth()
		for _, chart := range charts {
			chart.Height = (termui.TermHeight() - footer.Height) / rows
		}
		termui.Body.Align()
		termui.Render(termui.Body)
	})
	go func() {
		tick := time.NewTicker(time.Duration(ctx.Int(monitorCommandRefreshFlag.Name)) * time.Second)
		for range tick.C {
151
			if refreshCharts(client, monitored, data, units, charts, ctx, footer) {
152 153
				termui.Body.Align()
			}
154 155
			termui.Render(termui.Body)
		}
156 157
	}()
	termui.Loop()
158
	return nil
159 160
}

161 162
// retrieveMetrics contacts the attached geth node and retrieves the entire set
// of collected system metrics.
163 164 165 166
func retrieveMetrics(client *rpc.Client) (map[string]interface{}, error) {
	var metrics map[string]interface{}
	err := client.Call(&metrics, "debug_metrics", true)
	return metrics, err
167 168
}

169 170 171 172 173 174 175 176 177 178 179 180 181
// resolveMetrics expands every user supplied metric pattern against the metric
// tree and returns the concatenation of all canonical metric names found, in
// pattern order. The result is an empty (non-nil) slice when no pattern is given.
func resolveMetrics(metrics map[string]interface{}, patterns []string) []string {
	resolved := make([]string, 0)
	for i := range patterns {
		// Each pattern is resolved from the root of the tree (empty path prefix)
		matches := resolveMetric(metrics, patterns[i], "")
		resolved = append(resolved, matches...)
	}
	return resolved
}

// resolveMetrics takes a single of input metric pattern, and resolves it to one
// or more canonical metric names.
func resolveMetric(metrics map[string]interface{}, pattern string, path string) []string {
182 183 184 185 186 187 188 189 190 191 192 193
	results := []string{}

	// If a nested metric was requested, recurse optionally branching (via comma)
	parts := strings.SplitN(pattern, "/", 2)
	if len(parts) > 1 {
		for _, variation := range strings.Split(parts[0], ",") {
			if submetrics, ok := metrics[variation].(map[string]interface{}); !ok {
				utils.Fatalf("Failed to retrieve system metrics: %s", path+variation)
				return nil
			} else {
				results = append(results, resolveMetric(submetrics, parts[1], path+variation+"/")...)
			}
194
		}
195
		return results
196 197
	}
	// Depending what the last link is, return or expand
198 199 200 201 202
	for _, variation := range strings.Split(pattern, ",") {
		switch metric := metrics[variation].(type) {
		case float64:
			// Final metric value found, return as singleton
			results = append(results, path+variation)
203

204 205
		case map[string]interface{}:
			results = append(results, expandMetrics(metric, path+variation+"/")...)
206

207 208 209 210
		default:
			utils.Fatalf("Metric pattern resolved to unexpected type: %v", reflect.TypeOf(metric))
			return nil
		}
211
	}
212
	return results
213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235
}

// expandMetrics flattens a (sub-)tree of metrics into the list of full metric
// paths it contains, each prefixed with path. Numeric leaves contribute their
// own name, nested maps are walked recursively, and any other value type is
// reported through utils.Fatalf. The order of the result follows map
// iteration and is therefore unspecified.
func expandMetrics(metrics map[string]interface{}, path string) []string {
	names := []string{}
	for key, value := range metrics {
		full := path + key

		// Leaf: a plain numeric metric value
		if _, leaf := value.(float64); leaf {
			names = append(names, full)
			continue
		}
		// Branch: descend into the nested metric group
		if subtree, nested := value.(map[string]interface{}); nested {
			names = append(names, expandMetrics(subtree, full+"/")...)
			continue
		}
		utils.Fatalf("Metric pattern %s resolved to unexpected type: %v", full, reflect.TypeOf(value))
		return nil
	}
	return names
}
236

237 238
// fetchMetric iterates over the metrics map and retrieves a specific one.
//
// metric is a "/" separated path: every element but the last must name a
// nested map and the last must name a float64 value. If any element is
// missing or has a different type, 0 is returned.
func fetchMetric(metrics map[string]interface{}, metric string) float64 {
	parts := strings.Split(metric, "/")
	last := len(parts) - 1

	// Descend through the intermediate groups
	for _, part := range parts[:last] {
		var found bool
		metrics, found = metrics[part].(map[string]interface{})
		if !found {
			return 0
		}
	}
	// Read the leaf value, tolerating absent or non-numeric entries
	if v, ok := metrics[parts[last]].(float64); ok {
		return v
	}
	return 0
}

// refreshCharts retrieves a next batch of metrics, and inserts all the new
// values into the active datasets and charts
255
func refreshCharts(client *rpc.Client, metrics []string, data [][]float64, units []int, charts []*termui.LineChart, ctx *cli.Context, footer *termui.Par) (realign bool) {
256
	values, err := retrieveMetrics(client)
257
	for i, metric := range metrics {
258 259 260 261 262
		if len(data) < 512 {
			data[i] = append([]float64{fetchMetric(values, metric)}, data[i]...)
		} else {
			data[i] = append([]float64{fetchMetric(values, metric)}, data[i][:len(data[i])-1]...)
		}
263 264 265
		if updateChart(metric, data[i], &units[i], charts[i], err) {
			realign = true
		}
266 267
	}
	updateFooter(ctx, err, footer)
268
	return
269 270
}

271 272
// updateChart inserts a dataset into a line chart, scaling appropriately as to
// not display weird labels, also updating the chart label accordingly.
273
func updateChart(metric string, data []float64, base *int, chart *termui.LineChart, err error) (realign bool) {
274 275 276
	dataUnits := []string{"", "K", "M", "G", "T", "E"}
	timeUnits := []string{"ns", "µs", "ms", "s", "ks", "ms"}
	colors := []termui.Attribute{termui.ColorBlue, termui.ColorCyan, termui.ColorGreen, termui.ColorYellow, termui.ColorRed, termui.ColorRed}
277

278
	// Extract only part of the data that's actually visible
279 280 281
	if chart.Width*2 < len(data) {
		data = data[:chart.Width*2]
	}
282
	// Find the maximum value and scale under 1K
283 284 285 286 287 288
	high := 0.0
	if len(data) > 0 {
		high = data[0]
		for _, value := range data[1:] {
			high = math.Max(high, value)
		}
289 290
	}
	unit, scale := 0, 1.0
291
	for high >= 1000 && unit+1 < len(dataUnits) {
292 293
		high, unit, scale = high/1000, unit+1, scale*1000
	}
294 295 296 297
	// If the unit changes, re-create the chart (hack to set max height...)
	if unit != *base {
		realign, *base, *chart = true, unit, *createChart(chart.Height)
	}
298
	// Update the chart's data points with the scaled values
299 300 301 302
	if cap(chart.Data) < len(data) {
		chart.Data = make([]float64, len(data))
	}
	chart.Data = chart.Data[:len(data)]
303 304 305 306
	for i, value := range data {
		chart.Data[i] = value / scale
	}
	// Update the chart's label with the scale units
307
	units := dataUnits
308
	if strings.Contains(metric, "/Percentiles/") || strings.Contains(metric, "/pauses/") || strings.Contains(metric, "/time/") {
309 310
		units = timeUnits
	}
311
	chart.BorderLabel = metric
312
	if len(units[unit]) > 0 {
313
		chart.BorderLabel += " [" + units[unit] + "]"
314
	}
315 316 317 318
	chart.LineColor = colors[unit] | termui.AttrBold
	if err != nil {
		chart.LineColor = termui.ColorRed | termui.AttrBold
	}
319 320 321 322 323 324 325 326 327 328 329 330 331 332
	return
}

// createChart creates an empty line chart with the default configs.
func createChart(height int) *termui.LineChart {
	chart := termui.NewLineChart()
	if runtime.GOOS == "windows" {
		chart.Mode = "dot"
	}
	chart.DataLabels = []string{""}
	chart.Height = height
	chart.AxesColor = termui.ColorWhite
	chart.PaddingBottom = -2

333 334
	chart.BorderLabelFg = chart.BorderFg | termui.AttrBold
	chart.BorderFg = chart.BorderBg
335 336

	return chart
337 338 339 340 341 342
}

// updateFooter updates the footer contents based on any encountered errors.
func updateFooter(ctx *cli.Context, err error, footer *termui.Par) {
	// Generate the basic footer
	refresh := time.Duration(ctx.Int(monitorCommandRefreshFlag.Name)) * time.Second
343
	footer.Text = fmt.Sprintf("Press Ctrl+C to quit. Refresh interval: %v.", refresh)
344
	footer.TextFgColor = termui.ThemeAttr("par.fg") | termui.AttrBold
345 346 347 348 349 350

	// Append any encountered errors
	if err != nil {
		footer.Text = fmt.Sprintf("Error: %v.", err)
		footer.TextFgColor = termui.ColorRed | termui.AttrBold
	}
351
}