Add more metrics collection

Signed-off-by: Michael Crosby <crosbymichael@gmail.com>
This commit is contained in:
Michael Crosby 2015-12-18 16:54:02 -08:00
parent d08b005ca9
commit 7d4f74474e
7 changed files with 72 additions and 29 deletions

View file

@ -14,6 +14,7 @@ import (
"google.golang.org/grpc" "google.golang.org/grpc"
"github.com/Sirupsen/logrus" "github.com/Sirupsen/logrus"
"github.com/cloudfoundry/gosigar"
"github.com/codegangsta/cli" "github.com/codegangsta/cli"
"github.com/cyberdelia/go-metrics-graphite" "github.com/cyberdelia/go-metrics-graphite"
"github.com/docker/containerd" "github.com/docker/containerd"
@ -150,20 +151,33 @@ func debugMetrics(interval time.Duration, graphiteAddr string) error {
func processMetrics() { func processMetrics() {
var ( var (
g = metrics.NewGauge() g = metrics.NewGauge()
fg = metrics.NewGauge() fg = metrics.NewGauge()
memg = metrics.NewGauge()
) )
metrics.DefaultRegistry.Register("goroutines", g) metrics.DefaultRegistry.Register("goroutines", g)
metrics.DefaultRegistry.Register("fds", fg) metrics.DefaultRegistry.Register("fds", fg)
metrics.DefaultRegistry.Register("memory-used", memg)
collect := func() {
// update number of goroutines
g.Update(int64(runtime.NumGoroutine()))
// collect the number of open fds
fds, err := util.GetOpenFds(os.Getpid())
if err != nil {
logrus.WithField("error", err).Error("get open fd count")
}
fg.Update(int64(fds))
// get the memory used
m := sigar.ProcMem{}
if err := m.Get(os.Getpid()); err != nil {
logrus.WithField("error", err).Error("get pid memory information")
}
memg.Update(int64(m.Size))
}
go func() { go func() {
collect()
for range time.Tick(30 * time.Second) { for range time.Tick(30 * time.Second) {
g.Update(int64(runtime.NumGoroutine())) collect()
fds, err := util.GetOpenFds(os.Getpid())
if err != nil {
logrus.WithField("error", err).Error("get open fd count")
continue
}
fg.Update(int64(fds))
} }
}() }()
} }

View file

@ -1,6 +1,10 @@
package supervisor package supervisor
import "github.com/Sirupsen/logrus" import (
"time"
"github.com/Sirupsen/logrus"
)
type AddProcessEvent struct { type AddProcessEvent struct {
s *Supervisor s *Supervisor
@ -9,6 +13,7 @@ type AddProcessEvent struct {
// TODO: add this to worker for concurrent starts??? maybe not because of races where the container // TODO: add this to worker for concurrent starts??? maybe not because of races where the container
// could be stopped and removed... // could be stopped and removed...
func (h *AddProcessEvent) Handle(e *Event) error { func (h *AddProcessEvent) Handle(e *Event) error {
start := time.Now()
ci, ok := h.s.containers[e.ID] ci, ok := h.s.containers[e.ID]
if !ok { if !ok {
return ErrContainerNotFound return ErrContainerNotFound
@ -32,5 +37,6 @@ func (h *AddProcessEvent) Handle(e *Event) error {
}).Error("log stdio") }).Error("log stdio")
} }
h.s.processes[e.Pid].copier = l h.s.processes[e.Pid].copier = l
ExecProcessTimer.UpdateSince(start)
return nil return nil
} }

View file

@ -1,10 +1,13 @@
package supervisor package supervisor
import "time"
type StartEvent struct { type StartEvent struct {
s *Supervisor s *Supervisor
} }
func (h *StartEvent) Handle(e *Event) error { func (h *StartEvent) Handle(e *Event) error {
start := time.Now()
container, io, err := h.s.runtime.Create(e.ID, e.BundlePath, e.Console) container, io, err := h.s.runtime.Create(e.ID, e.BundlePath, e.Console)
if err != nil { if err != nil {
return err return err
@ -27,5 +30,6 @@ func (h *StartEvent) Handle(e *Event) error {
task.Checkpoint = e.Checkpoint.Name task.Checkpoint = e.Checkpoint.Name
} }
h.s.tasks <- task h.s.tasks <- task
ContainerCreateTimer.UpdateSince(start)
return errDeferedResponse return errDeferedResponse
} }

View file

@ -1,6 +1,8 @@
package supervisor package supervisor
import ( import (
"time"
"github.com/Sirupsen/logrus" "github.com/Sirupsen/logrus"
"github.com/docker/containerd/runtime" "github.com/docker/containerd/runtime"
) )
@ -11,6 +13,7 @@ type DeleteEvent struct {
func (h *DeleteEvent) Handle(e *Event) error { func (h *DeleteEvent) Handle(e *Event) error {
if i, ok := h.s.containers[e.ID]; ok { if i, ok := h.s.containers[e.ID]; ok {
start := time.Now()
if err := h.deleteContainer(i.container); err != nil { if err := h.deleteContainer(i.container); err != nil {
logrus.WithField("error", err).Error("containerd: deleting container") logrus.WithField("error", err).Error("containerd: deleting container")
} }
@ -27,6 +30,7 @@ func (h *DeleteEvent) Handle(e *Event) error {
}) })
ContainersCounter.Dec(1) ContainersCounter.Dec(1)
h.s.containerGroup.Done() h.s.containerGroup.Done()
ContainerDeleteTimer.UpdateSince(start)
} }
return nil return nil
} }

View file

@ -1,12 +1,17 @@
package supervisor package supervisor
import "github.com/Sirupsen/logrus" import (
"time"
"github.com/Sirupsen/logrus"
)
type ExitEvent struct { type ExitEvent struct {
s *Supervisor s *Supervisor
} }
func (h *ExitEvent) Handle(e *Event) error { func (h *ExitEvent) Handle(e *Event) error {
start := time.Now()
logrus.WithFields(logrus.Fields{"pid": e.Pid, "status": e.Status}). logrus.WithFields(logrus.Fields{"pid": e.Pid, "status": e.Status}).
Debug("containerd: process exited") Debug("containerd: process exited")
// is it the child process of a container // is it the child process of a container
@ -36,6 +41,7 @@ func (h *ExitEvent) Handle(e *Event) error {
stopCollect := NewEvent(StopStatsEventType) stopCollect := NewEvent(StopStatsEventType)
stopCollect.ID = container.ID() stopCollect.ID = container.ID()
h.s.SendEvent(stopCollect) h.s.SendEvent(stopCollect)
ExitProcessTimer.UpdateSince(start)
return nil return nil
} }

27
supervisor/metrics.go Normal file
View file

@ -0,0 +1,27 @@
package supervisor
import "github.com/rcrowley/go-metrics"
var (
ContainerCreateTimer = metrics.NewTimer()
ContainerDeleteTimer = metrics.NewTimer()
ContainerStartTimer = metrics.NewTimer()
ContainersCounter = metrics.NewCounter()
EventSubscriberCounter = metrics.NewCounter()
EventsCounter = metrics.NewCounter()
ExecProcessTimer = metrics.NewTimer()
ExitProcessTimer = metrics.NewTimer()
)
func Metrics() map[string]interface{} {
return map[string]interface{}{
"container-create-time": ContainerCreateTimer,
"container-delete-time": ContainerDeleteTimer,
"container-start-time": ContainerStartTimer,
"containers": ContainersCounter,
"event-subscribers": EventSubscriberCounter,
"events": EventsCounter,
"exec-process-time": ExecProcessTimer,
"exit-process-time": ExitProcessTimer,
}
}

View file

@ -1,23 +1,5 @@
package supervisor package supervisor
import "github.com/rcrowley/go-metrics"
var (
ContainerStartTimer = metrics.NewTimer()
ContainersCounter = metrics.NewCounter()
EventsCounter = metrics.NewCounter()
EventSubscriberCounter = metrics.NewCounter()
)
func Metrics() map[string]interface{} {
return map[string]interface{}{
"container-start-time": ContainerStartTimer,
"containers": ContainersCounter,
"events": EventsCounter,
"events-subscribers": EventSubscriberCounter,
}
}
type StatsEvent struct { type StatsEvent struct {
s *Supervisor s *Supervisor
} }