Add metrics

This commit is contained in:
Sean Braithwaite 2019-08-03 08:32:52 +02:00
parent 4bd619c329
commit f9a5f17f91
2 changed files with 146 additions and 6 deletions

124
blockchain/v2/metrics.go Normal file
View File

@ -0,0 +1,124 @@
package v2
import (
"github.com/go-kit/kit/metrics"
"github.com/go-kit/kit/metrics/discard"
"github.com/go-kit/kit/metrics/prometheus"
stdprometheus "github.com/prometheus/client_golang/prometheus"
)
// MetricsSubsystem is the subsystem name shared by every metric that this
// package exposes.
const MetricsSubsystem = "blockchain"
// Metrics contains metrics exposed by this package.
//
// Every field is a counter. The metric name given in each field comment is
// the name PrometheusMetrics registers the counter under.
type Metrics struct {
// events_in: events read from the channel.
EventsIn metrics.Counter
// events_handled: events handled.
EventsHandled metrics.Counter
// events_out: events output from routine.
EventsOut metrics.Counter
// errors_in: errors read from the channel.
ErrorsIn metrics.Counter
// errors_handled: errors handled.
ErrorsHandled metrics.Counter
// errors_out: errors output from routine.
ErrorsOut metrics.Counter
// events_shed: events dropped from sending.
EventsShed metrics.Counter
// events_sent: events sent to routine.
EventsSent metrics.Counter
// errors_sent: errors sent to routine.
ErrorsSent metrics.Counter
// errors_shed: errors dropped from sending.
ErrorsShed metrics.Counter
}
// PrometheusMetrics returns Metrics backed by Prometheus counters created
// under the given namespace and the MetricsSubsystem subsystem.
//
// labelsAndValues is a flat list of alternating label names and label values.
// The names (the elements at even indexes) are declared as label names on
// every counter, and the complete list is bound to each counter via With.
//
// In addition to the caller-supplied names, a "routine" label name is always
// declared (unless the caller already supplied it). Routine binds a "routine"
// label value with With("routine", name) before each Add, and the Prometheus
// client rejects label sets that do not match the declared label names, so
// omitting the declaration would make those Add calls fail.
//
// TODO: consider binding the routine name here instead of at each call site.
func PrometheusMetrics(namespace string, labelsAndValues ...string) *Metrics {
	const routineLabel = "routine"

	// Collect the label names: every other element, starting at index 0.
	labels := make([]string, 0, (len(labelsAndValues)+1)/2+1)
	hasRoutine := false
	for i := 0; i < len(labelsAndValues); i += 2 {
		if labelsAndValues[i] == routineLabel {
			hasRoutine = true
		}
		labels = append(labels, labelsAndValues[i])
	}
	// Declaring the same label name twice is invalid, so only add "routine"
	// when the caller has not already done so.
	if !hasRoutine {
		labels = append(labels, routineLabel)
	}

	// newCounter builds one counter sharing the namespace, subsystem, label
	// names and pre-bound label values common to all metrics of this package.
	newCounter := func(name, help string) metrics.Counter {
		return prometheus.NewCounterFrom(stdprometheus.CounterOpts{
			Namespace: namespace,
			Subsystem: MetricsSubsystem,
			Name:      name,
			Help:      help,
		}, labels).With(labelsAndValues...)
	}

	return &Metrics{
		EventsIn:      newCounter("events_in", "Events read from the channel."),
		EventsHandled: newCounter("events_handled", "Events handled"),
		EventsOut:     newCounter("events_out", "Events output from routine."),
		ErrorsIn:      newCounter("errors_in", "Errors read from the channel."),
		ErrorsHandled: newCounter("errors_handled", "Errors handled."),
		ErrorsOut:     newCounter("errors_out", "Errors output from routine."),
		ErrorsSent:    newCounter("errors_sent", "Errors sent to routine."),
		ErrorsShed:    newCounter("errors_shed", "Errors dropped from sending."),
		EventsSent:    newCounter("events_sent", "Events sent to routine."),
		EventsShed:    newCounter("events_shed", "Events dropped from sending."),
	}
}
// NopMetrics returns a Metrics in which every counter is a no-op counter
// from the discard package.
func NopMetrics() *Metrics {
	nop := new(Metrics)

	// Event counters.
	nop.EventsIn = discard.NewCounter()
	nop.EventsHandled = discard.NewCounter()
	nop.EventsOut = discard.NewCounter()
	nop.EventsSent = discard.NewCounter()
	nop.EventsShed = discard.NewCounter()

	// Error counters.
	nop.ErrorsIn = discard.NewCounter()
	nop.ErrorsHandled = discard.NewCounter()
	nop.ErrorsOut = discard.NewCounter()
	nop.ErrorsSent = discard.NewCounter()
	nop.ErrorsShed = discard.NewCounter()

	return nop
}

View File

@ -8,23 +8,25 @@ import (
) )
// TODO // TODO
// metrics // * revisit panic conditions
// revisit panic conditions // * audit log levels
// audit log levels // * maybe routine should be an interface and the concrete type should be handlerRoutine
// maybe routine should be an interface and the concrete type should be handlerRoutine
// Adding Metrics
// we need a metrics definition
type handleFunc = func(event Event) (Events, error) type handleFunc = func(event Event) (Events, error)
type Routine struct { type Routine struct {
name string name string
input chan Event input chan Event
errors chan error errors chan error
logger log.Logger
output chan Event output chan Event
stopped chan struct{} stopped chan struct{}
finished chan error finished chan error
running *uint32 running *uint32
handle handleFunc handle handleFunc
logger log.Logger
metrics *Metrics
} }
func newRoutine(name string, output chan Event, handleFunc handleFunc) *Routine { func newRoutine(name string, output chan Event, handleFunc handleFunc) *Routine {
@ -38,6 +40,7 @@ func newRoutine(name string, output chan Event, handleFunc handleFunc) *Routine
finished: make(chan error, 1), finished: make(chan error, 1),
running: new(uint32), running: new(uint32),
logger: log.NewNopLogger(), logger: log.NewNopLogger(),
metrics: NopMetrics(),
} }
} }
@ -45,6 +48,10 @@ func (rt *Routine) setLogger(logger log.Logger) {
rt.logger = logger rt.logger = logger
} }
func (rt *Routine) setMetrics(metrics *Metrics) {
rt.metrics = metrics
}
func (rt *Routine) run() { func (rt *Routine) run() {
rt.logger.Info(fmt.Sprintf("%s: run\n", rt.name)) rt.logger.Info(fmt.Sprintf("%s: run\n", rt.name))
starting := atomic.CompareAndSwapUint32(rt.running, uint32(0), uint32(1)) starting := atomic.CompareAndSwapUint32(rt.running, uint32(0), uint32(1))
@ -58,6 +65,7 @@ func (rt *Routine) run() {
} }
select { select {
case iEvent, ok := <-rt.input: case iEvent, ok := <-rt.input:
rt.metrics.EventsIn.With("routine", rt.name).Add(1)
if !ok { if !ok {
if !errorsDrained { if !errorsDrained {
continue // wait for errors to be drainned continue // wait for errors to be drainned
@ -67,27 +75,31 @@ func (rt *Routine) run() {
return return
} }
oEvents, err := rt.handle(iEvent) oEvents, err := rt.handle(iEvent)
rt.metrics.EventsHandled.With("routine", rt.name).Add(1)
if err != nil { if err != nil {
rt.terminate(err) rt.terminate(err)
return return
} }
rt.metrics.EventsOut.With("routine", rt.name).Add(float64(len(oEvents)))
rt.logger.Info(fmt.Sprintf("%s handled %d events\n", rt.name, len(oEvents))) rt.logger.Info(fmt.Sprintf("%s handled %d events\n", rt.name, len(oEvents)))
for _, event := range oEvents { for _, event := range oEvents {
rt.logger.Info(fmt.Sprintln("writting back to output")) rt.logger.Info(fmt.Sprintln("writting back to output"))
rt.output <- event rt.output <- event
} }
case iEvent, ok := <-rt.errors: case iEvent, ok := <-rt.errors:
rt.metrics.ErrorsIn.With("routine", rt.name).Add(1)
if !ok { if !ok {
rt.logger.Info(fmt.Sprintf("%s: errors closed\n", rt.name)) rt.logger.Info(fmt.Sprintf("%s: errors closed\n", rt.name))
errorsDrained = true errorsDrained = true
continue continue
} }
oEvents, err := rt.handle(iEvent) oEvents, err := rt.handle(iEvent)
rt.metrics.ErrorsHandled.With("routine", rt.name).Add(1)
if err != nil { if err != nil {
rt.terminate(err) rt.terminate(err)
return return
} }
rt.metrics.ErrorsOut.With("routine", rt.name).Add(float64(len(oEvents)))
for _, event := range oEvents { for _, event := range oEvents {
rt.output <- event rt.output <- event
} }
@ -104,16 +116,20 @@ func (rt *Routine) send(event Event) bool {
if err, ok := event.(error); ok { if err, ok := event.(error); ok {
select { select {
case rt.errors <- err: case rt.errors <- err:
rt.metrics.ErrorsSent.With("routine", rt.name).Add(1)
return true return true
default: default:
rt.metrics.ErrorsShed.With("routine", rt.name).Add(1)
rt.logger.Info(fmt.Sprintf("%s: errors channel was full\n", rt.name)) rt.logger.Info(fmt.Sprintf("%s: errors channel was full\n", rt.name))
return false return false
} }
} else { } else {
select { select {
case rt.input <- event: case rt.input <- event:
rt.metrics.EventsSent.With("routine", rt.name).Add(1)
return true return true
default: default:
rt.metrics.EventsShed.With("routine", rt.name).Add(1)
rt.logger.Info(fmt.Sprintf("%s: channel was full\n", rt.name)) rt.logger.Info(fmt.Sprintf("%s: channel was full\n", rt.name))
return false return false
} }